Changeset View
Changeset View
Standalone View
Standalone View
clang/test/OpenMP/nvptx_target_codegen.cpp
Show First 20 Lines • Show All 159 Lines • ▼ Show 20 Lines | |||||
// CHECK1-NEXT: [[TMP2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]]) | // CHECK1-NEXT: [[TMP2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]]) | ||||
// CHECK1-NEXT: [[TMP3:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i64 0, i64 0 | // CHECK1-NEXT: [[TMP3:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i64 0, i64 0 | ||||
// CHECK1-NEXT: [[TMP4:%.*]] = bitcast i32** [[PTR1_ADDR]] to i8* | // CHECK1-NEXT: [[TMP4:%.*]] = bitcast i32** [[PTR1_ADDR]] to i8* | ||||
// CHECK1-NEXT: store i8* [[TMP4]], i8** [[TMP3]], align 8 | // CHECK1-NEXT: store i8* [[TMP4]], i8** [[TMP3]], align 8 | ||||
// CHECK1-NEXT: [[TMP5:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i64 0, i64 1 | // CHECK1-NEXT: [[TMP5:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i64 0, i64 1 | ||||
// CHECK1-NEXT: [[TMP6:%.*]] = bitcast i32** [[TMP0]] to i8* | // CHECK1-NEXT: [[TMP6:%.*]] = bitcast i32** [[TMP0]] to i8* | ||||
// CHECK1-NEXT: store i8* [[TMP6]], i8** [[TMP5]], align 8 | // CHECK1-NEXT: store i8* [[TMP6]], i8** [[TMP5]], align 8 | ||||
// CHECK1-NEXT: [[TMP7:%.*]] = bitcast [2 x i8*]* [[CAPTURED_VARS_ADDRS]] to i8** | // CHECK1-NEXT: [[TMP7:%.*]] = bitcast [2 x i8*]* [[CAPTURED_VARS_ADDRS]] to i8** | ||||
// CHECK1-NEXT: call void @__kmpc_parallel_51(%struct.ident_t* @[[GLOB2]], i32 [[TMP2]], i32 1, i32 -1, i32 -1, i8* bitcast (void (i32*, i32*, i32**, i32**)* @__omp_outlined__ to i8*), i8* null, i8** [[TMP7]], i64 2) | // CHECK1-NEXT: call void @__kmpc_parallel_51(%struct.ident_t* @[[GLOB2]], i32 [[TMP2]], i32 1, i32 2, i32 -1, i8* bitcast (void (i32*, i32*, i32**, i32**)* @__omp_outlined__ to i8*), i8* null, i8** [[TMP7]], i64 2) | ||||
// CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 2, i1 true) | // CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 2, i1 true) | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// CHECK1: worker.exit: | // CHECK1: worker.exit: | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK1-LABEL: define {{[^@]+}}@__omp_outlined__ | // CHECK1-LABEL: define {{[^@]+}}@__omp_outlined__ | ||||
// CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32** nonnull align 8 dereferenceable(8) [[PTR1:%.*]], i32** nonnull align 8 dereferenceable(8) [[PTR2:%.*]]) #[[ATTR1:[0-9]+]] { | // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32** nonnull align 8 dereferenceable(8) [[PTR1:%.*]], i32** nonnull align 8 dereferenceable(8) [[PTR2:%.*]]) #[[ATTR1:[0-9]+]] { | ||||
▲ Show 20 Lines • Show All 119 Lines • ▼ Show 20 Lines | |||||
// CHECK1-NEXT: [[ADD18:%.*]] = add nsw i64 [[TMP15]], 1 | // CHECK1-NEXT: [[ADD18:%.*]] = add nsw i64 [[TMP15]], 1 | ||||
// CHECK1-NEXT: store i64 [[ADD18]], i64* [[X]], align 8 | // CHECK1-NEXT: store i64 [[ADD18]], i64* [[X]], align 8 | ||||
// CHECK1-NEXT: [[Y:%.*]] = getelementptr inbounds [[STRUCT_TT]], %struct.TT* [[TMP7]], i32 0, i32 1 | // CHECK1-NEXT: [[Y:%.*]] = getelementptr inbounds [[STRUCT_TT]], %struct.TT* [[TMP7]], i32 0, i32 1 | ||||
// CHECK1-NEXT: [[TMP16:%.*]] = load i8, i8* [[Y]], align 8 | // CHECK1-NEXT: [[TMP16:%.*]] = load i8, i8* [[Y]], align 8 | ||||
// CHECK1-NEXT: [[CONV19:%.*]] = sext i8 [[TMP16]] to i32 | // CHECK1-NEXT: [[CONV19:%.*]] = sext i8 [[TMP16]] to i32 | ||||
// CHECK1-NEXT: [[ADD20:%.*]] = add nsw i32 [[CONV19]], 1 | // CHECK1-NEXT: [[ADD20:%.*]] = add nsw i32 [[CONV19]], 1 | ||||
// CHECK1-NEXT: [[CONV21:%.*]] = trunc i32 [[ADD20]] to i8 | // CHECK1-NEXT: [[CONV21:%.*]] = trunc i32 [[ADD20]] to i8 | ||||
// CHECK1-NEXT: store i8 [[CONV21]], i8* [[Y]], align 8 | // CHECK1-NEXT: store i8 [[CONV21]], i8* [[Y]], align 8 | ||||
// CHECK1-NEXT: [[CALL:%.*]] = call nonnull align 8 dereferenceable(8) i64* @_ZN2TTIxcEixEi(%struct.TT* nonnull align 8 dereferenceable(16) [[TMP7]], i32 0) #[[ATTR6:[0-9]+]] | // CHECK1-NEXT: [[CALL:%.*]] = call nonnull align 8 dereferenceable(8) i64* @_ZN2TTIxcEixEi(%struct.TT* nonnull align 8 dereferenceable(16) [[TMP7]], i32 0) #[[ATTR8:[0-9]+]] | ||||
// CHECK1-NEXT: [[TMP17:%.*]] = load i64, i64* [[CALL]], align 8 | // CHECK1-NEXT: [[TMP17:%.*]] = load i64, i64* [[CALL]], align 8 | ||||
// CHECK1-NEXT: [[ADD22:%.*]] = add nsw i64 [[TMP17]], 1 | // CHECK1-NEXT: [[ADD22:%.*]] = add nsw i64 [[TMP17]], 1 | ||||
// CHECK1-NEXT: store i64 [[ADD22]], i64* [[CALL]], align 8 | // CHECK1-NEXT: store i64 [[ADD22]], i64* [[CALL]], align 8 | ||||
// CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// CHECK1: worker.exit: | // CHECK1: worker.exit: | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK1-LABEL: define {{[^@]+}}@_ZN2TTIxcEixEi | // CHECK1-LABEL: define {{[^@]+}}@_ZN2TTIxcEixEi | ||||
// CHECK1-SAME: (%struct.TT* nonnull align 8 dereferenceable(16) [[THIS:%.*]], i32 [[I:%.*]]) #[[ATTR3:[0-9]+]] comdat align 2 { | // CHECK1-SAME: (%struct.TT* nonnull align 8 dereferenceable(16) [[THIS:%.*]], i32 [[I:%.*]]) #[[ATTR4:[0-9]+]] comdat align 2 { | ||||
// CHECK1-NEXT: entry: | // CHECK1-NEXT: entry: | ||||
// CHECK1-NEXT: [[THIS_ADDR:%.*]] = alloca %struct.TT*, align 8 | // CHECK1-NEXT: [[THIS_ADDR:%.*]] = alloca %struct.TT*, align 8 | ||||
// CHECK1-NEXT: [[I_ADDR:%.*]] = alloca i32, align 4 | // CHECK1-NEXT: [[I_ADDR:%.*]] = alloca i32, align 4 | ||||
// CHECK1-NEXT: store %struct.TT* [[THIS]], %struct.TT** [[THIS_ADDR]], align 8 | // CHECK1-NEXT: store %struct.TT* [[THIS]], %struct.TT** [[THIS_ADDR]], align 8 | ||||
// CHECK1-NEXT: store i32 [[I]], i32* [[I_ADDR]], align 4 | // CHECK1-NEXT: store i32 [[I]], i32* [[I_ADDR]], align 4 | ||||
// CHECK1-NEXT: [[THIS1:%.*]] = load %struct.TT*, %struct.TT** [[THIS_ADDR]], align 8 | // CHECK1-NEXT: [[THIS1:%.*]] = load %struct.TT*, %struct.TT** [[THIS_ADDR]], align 8 | ||||
// CHECK1-NEXT: [[X:%.*]] = getelementptr inbounds [[STRUCT_TT:%.*]], %struct.TT* [[THIS1]], i32 0, i32 0 | // CHECK1-NEXT: [[X:%.*]] = getelementptr inbounds [[STRUCT_TT:%.*]], %struct.TT* [[THIS1]], i32 0, i32 0 | ||||
// CHECK1-NEXT: ret i64* [[X]] | // CHECK1-NEXT: ret i64* [[X]] | ||||
▲ Show 20 Lines • Show All 76 Lines • ▼ Show 20 Lines | |||||
// CHECK1-NEXT: [[TMP7:%.*]] = mul nsw i64 1, [[TMP2]] | // CHECK1-NEXT: [[TMP7:%.*]] = mul nsw i64 1, [[TMP2]] | ||||
// CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i16, i16* [[TMP3]], i64 [[TMP7]] | // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i16, i16* [[TMP3]], i64 [[TMP7]] | ||||
// CHECK1-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i16, i16* [[ARRAYIDX]], i64 1 | // CHECK1-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i16, i16* [[ARRAYIDX]], i64 1 | ||||
// CHECK1-NEXT: store i16 [[CONV5]], i16* [[ARRAYIDX6]], align 2 | // CHECK1-NEXT: store i16 [[CONV5]], i16* [[ARRAYIDX6]], align 2 | ||||
// CHECK1-NEXT: [[A7:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | // CHECK1-NEXT: [[A7:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | ||||
// CHECK1-NEXT: [[TMP8:%.*]] = load double, double* [[A7]], align 8 | // CHECK1-NEXT: [[TMP8:%.*]] = load double, double* [[A7]], align 8 | ||||
// CHECK1-NEXT: [[CONV8:%.*]] = fptosi double [[TMP8]] to i32 | // CHECK1-NEXT: [[CONV8:%.*]] = fptosi double [[TMP8]] to i32 | ||||
// CHECK1-NEXT: [[A9:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | // CHECK1-NEXT: [[A9:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | ||||
// CHECK1-NEXT: [[CALL:%.*]] = call i32 @_Z3baziRd(i32 [[CONV8]], double* nonnull align 8 dereferenceable(8) [[A9]]) #[[ATTR6]] | // CHECK1-NEXT: [[CALL:%.*]] = call i32 @_Z3baziRd(i32 [[CONV8]], double* nonnull align 8 dereferenceable(8) [[A9]]) #[[ATTR8]] | ||||
// CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// CHECK1: worker.exit: | // CHECK1: worker.exit: | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK1-LABEL: define {{[^@]+}}@_Z3baziRd | // CHECK1-LABEL: define {{[^@]+}}@_Z3baziRd | ||||
// CHECK1-SAME: (i32 [[F1:%.*]], double* nonnull align 8 dereferenceable(8) [[A:%.*]]) #[[ATTR3]] { | // CHECK1-SAME: (i32 [[F1:%.*]], double* nonnull align 8 dereferenceable(8) [[A:%.*]]) #[[ATTR4]] { | ||||
// CHECK1-NEXT: entry: | // CHECK1-NEXT: entry: | ||||
// CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 | // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 | ||||
// CHECK1-NEXT: [[CAPTURED_VARS_ADDRS:%.*]] = alloca [2 x i8*], align 8 | // CHECK1-NEXT: [[CAPTURED_VARS_ADDRS:%.*]] = alloca [2 x i8*], align 8 | ||||
// CHECK1-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB3:[0-9]+]]) | // CHECK1-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB3:[0-9]+]]) | ||||
// CHECK1-NEXT: [[F:%.*]] = call i8* @__kmpc_alloc_shared(i64 4) | // CHECK1-NEXT: [[F:%.*]] = call i8* @__kmpc_alloc_shared(i64 4) | ||||
// CHECK1-NEXT: [[F_ON_STACK:%.*]] = bitcast i8* [[F]] to i32* | // CHECK1-NEXT: [[F_ON_STACK:%.*]] = bitcast i8* [[F]] to i32* | ||||
// CHECK1-NEXT: store i32 [[F1]], i32* [[F_ON_STACK]], align 4 | // CHECK1-NEXT: store i32 [[F1]], i32* [[F_ON_STACK]], align 4 | ||||
// CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 | // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 | ||||
Show All 13 Lines | |||||
// | // | ||||
// CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z16unreachable_callv_l142 | // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z16unreachable_callv_l142 | ||||
// CHECK1-SAME: () #[[ATTR1]] { | // CHECK1-SAME: () #[[ATTR1]] { | ||||
// CHECK1-NEXT: entry: | // CHECK1-NEXT: entry: | ||||
// CHECK1-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_target_init(%struct.ident_t* @[[GLOB1]], i8 1, i1 true, i1 true) | // CHECK1-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_target_init(%struct.ident_t* @[[GLOB1]], i8 1, i1 true, i1 true) | ||||
// CHECK1-NEXT: [[EXEC_USER_CODE:%.*]] = icmp eq i32 [[TMP0]], -1 | // CHECK1-NEXT: [[EXEC_USER_CODE:%.*]] = icmp eq i32 [[TMP0]], -1 | ||||
// CHECK1-NEXT: br i1 [[EXEC_USER_CODE]], label [[USER_CODE_ENTRY:%.*]], label [[WORKER_EXIT:%.*]] | // CHECK1-NEXT: br i1 [[EXEC_USER_CODE]], label [[USER_CODE_ENTRY:%.*]], label [[WORKER_EXIT:%.*]] | ||||
// CHECK1: user_code.entry: | // CHECK1: user_code.entry: | ||||
// CHECK1-NEXT: call void @_Z6asserti(i32 0) #[[ATTR7:[0-9]+]] | // CHECK1-NEXT: call void @_Z6asserti(i32 0) #[[ATTR9:[0-9]+]] | ||||
// CHECK1-NEXT: unreachable | // CHECK1-NEXT: unreachable | ||||
// CHECK1: worker.exit: | // CHECK1: worker.exit: | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// CHECK1: 1: | // CHECK1: 1: | ||||
// CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK1-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
▲ Show 20 Lines • Show All 50 Lines • ▼ Show 20 Lines | |||||
// CHECK1-NEXT: [[TMP3:%.*]] = load double, double* [[TMP2]], align 8 | // CHECK1-NEXT: [[TMP3:%.*]] = load double, double* [[TMP2]], align 8 | ||||
// CHECK1-NEXT: [[ADD:%.*]] = fadd double 2.000000e+00, [[TMP3]] | // CHECK1-NEXT: [[ADD:%.*]] = fadd double 2.000000e+00, [[TMP3]] | ||||
// CHECK1-NEXT: [[CONV:%.*]] = fptosi double [[ADD]] to i32 | // CHECK1-NEXT: [[CONV:%.*]] = fptosi double [[ADD]] to i32 | ||||
// CHECK1-NEXT: store i32 [[CONV]], i32* [[TMP0]], align 4 | // CHECK1-NEXT: store i32 [[CONV]], i32* [[TMP0]], align 4 | ||||
// CHECK1-NEXT: ret void | // CHECK1-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK1-LABEL: define {{[^@]+}}@__omp_outlined__1_wrapper | // CHECK1-LABEL: define {{[^@]+}}@__omp_outlined__1_wrapper | ||||
// CHECK1-SAME: (i16 zeroext [[TMP0:%.*]], i32 [[TMP1:%.*]]) #[[ATTR5:[0-9]+]] { | // CHECK1-SAME: (i16 zeroext [[TMP0:%.*]], i32 [[TMP1:%.*]]) #[[ATTR7:[0-9]+]] { | ||||
// CHECK1-NEXT: entry: | // CHECK1-NEXT: entry: | ||||
// CHECK1-NEXT: [[DOTADDR:%.*]] = alloca i16, align 2 | // CHECK1-NEXT: [[DOTADDR:%.*]] = alloca i16, align 2 | ||||
// CHECK1-NEXT: [[DOTADDR1:%.*]] = alloca i32, align 4 | // CHECK1-NEXT: [[DOTADDR1:%.*]] = alloca i32, align 4 | ||||
// CHECK1-NEXT: [[DOTZERO_ADDR:%.*]] = alloca i32, align 4 | // CHECK1-NEXT: [[DOTZERO_ADDR:%.*]] = alloca i32, align 4 | ||||
// CHECK1-NEXT: [[GLOBAL_ARGS:%.*]] = alloca i8**, align 8 | // CHECK1-NEXT: [[GLOBAL_ARGS:%.*]] = alloca i8**, align 8 | ||||
// CHECK1-NEXT: store i16 [[TMP0]], i16* [[DOTADDR]], align 2 | // CHECK1-NEXT: store i16 [[TMP0]], i16* [[DOTADDR]], align 2 | ||||
// CHECK1-NEXT: store i32 [[TMP1]], i32* [[DOTADDR1]], align 4 | // CHECK1-NEXT: store i32 [[TMP1]], i32* [[DOTADDR1]], align 4 | ||||
// CHECK1-NEXT: store i32 0, i32* [[DOTZERO_ADDR]], align 4 | // CHECK1-NEXT: store i32 0, i32* [[DOTZERO_ADDR]], align 4 | ||||
Show All 25 Lines | |||||
// CHECK2-NEXT: [[TMP2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]]) | // CHECK2-NEXT: [[TMP2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]]) | ||||
// CHECK2-NEXT: [[TMP3:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 0 | // CHECK2-NEXT: [[TMP3:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 0 | ||||
// CHECK2-NEXT: [[TMP4:%.*]] = bitcast i32** [[PTR1_ADDR]] to i8* | // CHECK2-NEXT: [[TMP4:%.*]] = bitcast i32** [[PTR1_ADDR]] to i8* | ||||
// CHECK2-NEXT: store i8* [[TMP4]], i8** [[TMP3]], align 4 | // CHECK2-NEXT: store i8* [[TMP4]], i8** [[TMP3]], align 4 | ||||
// CHECK2-NEXT: [[TMP5:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 1 | // CHECK2-NEXT: [[TMP5:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 1 | ||||
// CHECK2-NEXT: [[TMP6:%.*]] = bitcast i32** [[TMP0]] to i8* | // CHECK2-NEXT: [[TMP6:%.*]] = bitcast i32** [[TMP0]] to i8* | ||||
// CHECK2-NEXT: store i8* [[TMP6]], i8** [[TMP5]], align 4 | // CHECK2-NEXT: store i8* [[TMP6]], i8** [[TMP5]], align 4 | ||||
// CHECK2-NEXT: [[TMP7:%.*]] = bitcast [2 x i8*]* [[CAPTURED_VARS_ADDRS]] to i8** | // CHECK2-NEXT: [[TMP7:%.*]] = bitcast [2 x i8*]* [[CAPTURED_VARS_ADDRS]] to i8** | ||||
// CHECK2-NEXT: call void @__kmpc_parallel_51(%struct.ident_t* @[[GLOB2]], i32 [[TMP2]], i32 1, i32 -1, i32 -1, i8* bitcast (void (i32*, i32*, i32**, i32**)* @__omp_outlined__ to i8*), i8* null, i8** [[TMP7]], i32 2) | // CHECK2-NEXT: call void @__kmpc_parallel_51(%struct.ident_t* @[[GLOB2]], i32 [[TMP2]], i32 1, i32 2, i32 -1, i8* bitcast (void (i32*, i32*, i32**, i32**)* @__omp_outlined__ to i8*), i8* null, i8** [[TMP7]], i32 2) | ||||
// CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 2, i1 true) | // CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 2, i1 true) | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// CHECK2: worker.exit: | // CHECK2: worker.exit: | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK2-LABEL: define {{[^@]+}}@__omp_outlined__ | // CHECK2-LABEL: define {{[^@]+}}@__omp_outlined__ | ||||
// CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR1:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR2:%.*]]) #[[ATTR1:[0-9]+]] { | // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR1:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR2:%.*]]) #[[ATTR1:[0-9]+]] { | ||||
▲ Show 20 Lines • Show All 118 Lines • ▼ Show 20 Lines | |||||
// CHECK2-NEXT: [[ADD17:%.*]] = add nsw i64 [[TMP15]], 1 | // CHECK2-NEXT: [[ADD17:%.*]] = add nsw i64 [[TMP15]], 1 | ||||
// CHECK2-NEXT: store i64 [[ADD17]], i64* [[X]], align 8 | // CHECK2-NEXT: store i64 [[ADD17]], i64* [[X]], align 8 | ||||
// CHECK2-NEXT: [[Y:%.*]] = getelementptr inbounds [[STRUCT_TT]], %struct.TT* [[TMP7]], i32 0, i32 1 | // CHECK2-NEXT: [[Y:%.*]] = getelementptr inbounds [[STRUCT_TT]], %struct.TT* [[TMP7]], i32 0, i32 1 | ||||
// CHECK2-NEXT: [[TMP16:%.*]] = load i8, i8* [[Y]], align 8 | // CHECK2-NEXT: [[TMP16:%.*]] = load i8, i8* [[Y]], align 8 | ||||
// CHECK2-NEXT: [[CONV18:%.*]] = sext i8 [[TMP16]] to i32 | // CHECK2-NEXT: [[CONV18:%.*]] = sext i8 [[TMP16]] to i32 | ||||
// CHECK2-NEXT: [[ADD19:%.*]] = add nsw i32 [[CONV18]], 1 | // CHECK2-NEXT: [[ADD19:%.*]] = add nsw i32 [[CONV18]], 1 | ||||
// CHECK2-NEXT: [[CONV20:%.*]] = trunc i32 [[ADD19]] to i8 | // CHECK2-NEXT: [[CONV20:%.*]] = trunc i32 [[ADD19]] to i8 | ||||
// CHECK2-NEXT: store i8 [[CONV20]], i8* [[Y]], align 8 | // CHECK2-NEXT: store i8 [[CONV20]], i8* [[Y]], align 8 | ||||
// CHECK2-NEXT: [[CALL:%.*]] = call nonnull align 8 dereferenceable(8) i64* @_ZN2TTIxcEixEi(%struct.TT* nonnull align 8 dereferenceable(16) [[TMP7]], i32 0) #[[ATTR6:[0-9]+]] | // CHECK2-NEXT: [[CALL:%.*]] = call nonnull align 8 dereferenceable(8) i64* @_ZN2TTIxcEixEi(%struct.TT* nonnull align 8 dereferenceable(16) [[TMP7]], i32 0) #[[ATTR8:[0-9]+]] | ||||
// CHECK2-NEXT: [[TMP17:%.*]] = load i64, i64* [[CALL]], align 8 | // CHECK2-NEXT: [[TMP17:%.*]] = load i64, i64* [[CALL]], align 8 | ||||
// CHECK2-NEXT: [[ADD21:%.*]] = add nsw i64 [[TMP17]], 1 | // CHECK2-NEXT: [[ADD21:%.*]] = add nsw i64 [[TMP17]], 1 | ||||
// CHECK2-NEXT: store i64 [[ADD21]], i64* [[CALL]], align 8 | // CHECK2-NEXT: store i64 [[ADD21]], i64* [[CALL]], align 8 | ||||
// CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// CHECK2: worker.exit: | // CHECK2: worker.exit: | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK2-LABEL: define {{[^@]+}}@_ZN2TTIxcEixEi | // CHECK2-LABEL: define {{[^@]+}}@_ZN2TTIxcEixEi | ||||
// CHECK2-SAME: (%struct.TT* nonnull align 8 dereferenceable(16) [[THIS:%.*]], i32 [[I:%.*]]) #[[ATTR3:[0-9]+]] comdat align 2 { | // CHECK2-SAME: (%struct.TT* nonnull align 8 dereferenceable(16) [[THIS:%.*]], i32 [[I:%.*]]) #[[ATTR4:[0-9]+]] comdat align 2 { | ||||
// CHECK2-NEXT: entry: | // CHECK2-NEXT: entry: | ||||
// CHECK2-NEXT: [[THIS_ADDR:%.*]] = alloca %struct.TT*, align 4 | // CHECK2-NEXT: [[THIS_ADDR:%.*]] = alloca %struct.TT*, align 4 | ||||
// CHECK2-NEXT: [[I_ADDR:%.*]] = alloca i32, align 4 | // CHECK2-NEXT: [[I_ADDR:%.*]] = alloca i32, align 4 | ||||
// CHECK2-NEXT: store %struct.TT* [[THIS]], %struct.TT** [[THIS_ADDR]], align 4 | // CHECK2-NEXT: store %struct.TT* [[THIS]], %struct.TT** [[THIS_ADDR]], align 4 | ||||
// CHECK2-NEXT: store i32 [[I]], i32* [[I_ADDR]], align 4 | // CHECK2-NEXT: store i32 [[I]], i32* [[I_ADDR]], align 4 | ||||
// CHECK2-NEXT: [[THIS1:%.*]] = load %struct.TT*, %struct.TT** [[THIS_ADDR]], align 4 | // CHECK2-NEXT: [[THIS1:%.*]] = load %struct.TT*, %struct.TT** [[THIS_ADDR]], align 4 | ||||
// CHECK2-NEXT: [[X:%.*]] = getelementptr inbounds [[STRUCT_TT:%.*]], %struct.TT* [[THIS1]], i32 0, i32 0 | // CHECK2-NEXT: [[X:%.*]] = getelementptr inbounds [[STRUCT_TT:%.*]], %struct.TT* [[THIS1]], i32 0, i32 0 | ||||
// CHECK2-NEXT: ret i64* [[X]] | // CHECK2-NEXT: ret i64* [[X]] | ||||
▲ Show 20 Lines • Show All 74 Lines • ▼ Show 20 Lines | |||||
// CHECK2-NEXT: [[TMP7:%.*]] = mul nsw i32 1, [[TMP2]] | // CHECK2-NEXT: [[TMP7:%.*]] = mul nsw i32 1, [[TMP2]] | ||||
// CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i16, i16* [[TMP3]], i32 [[TMP7]] | // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i16, i16* [[TMP3]], i32 [[TMP7]] | ||||
// CHECK2-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i16, i16* [[ARRAYIDX]], i32 1 | // CHECK2-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i16, i16* [[ARRAYIDX]], i32 1 | ||||
// CHECK2-NEXT: store i16 [[CONV4]], i16* [[ARRAYIDX5]], align 2 | // CHECK2-NEXT: store i16 [[CONV4]], i16* [[ARRAYIDX5]], align 2 | ||||
// CHECK2-NEXT: [[A6:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | // CHECK2-NEXT: [[A6:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | ||||
// CHECK2-NEXT: [[TMP8:%.*]] = load double, double* [[A6]], align 8 | // CHECK2-NEXT: [[TMP8:%.*]] = load double, double* [[A6]], align 8 | ||||
// CHECK2-NEXT: [[CONV7:%.*]] = fptosi double [[TMP8]] to i32 | // CHECK2-NEXT: [[CONV7:%.*]] = fptosi double [[TMP8]] to i32 | ||||
// CHECK2-NEXT: [[A8:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | // CHECK2-NEXT: [[A8:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | ||||
// CHECK2-NEXT: [[CALL:%.*]] = call i32 @_Z3baziRd(i32 [[CONV7]], double* nonnull align 8 dereferenceable(8) [[A8]]) #[[ATTR6]] | // CHECK2-NEXT: [[CALL:%.*]] = call i32 @_Z3baziRd(i32 [[CONV7]], double* nonnull align 8 dereferenceable(8) [[A8]]) #[[ATTR8]] | ||||
// CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// CHECK2: worker.exit: | // CHECK2: worker.exit: | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK2-LABEL: define {{[^@]+}}@_Z3baziRd | // CHECK2-LABEL: define {{[^@]+}}@_Z3baziRd | ||||
// CHECK2-SAME: (i32 [[F1:%.*]], double* nonnull align 8 dereferenceable(8) [[A:%.*]]) #[[ATTR3]] { | // CHECK2-SAME: (i32 [[F1:%.*]], double* nonnull align 8 dereferenceable(8) [[A:%.*]]) #[[ATTR4]] { | ||||
// CHECK2-NEXT: entry: | // CHECK2-NEXT: entry: | ||||
// CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 | // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 | ||||
// CHECK2-NEXT: [[CAPTURED_VARS_ADDRS:%.*]] = alloca [2 x i8*], align 4 | // CHECK2-NEXT: [[CAPTURED_VARS_ADDRS:%.*]] = alloca [2 x i8*], align 4 | ||||
// CHECK2-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB3:[0-9]+]]) | // CHECK2-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB3:[0-9]+]]) | ||||
// CHECK2-NEXT: [[F:%.*]] = call i8* @__kmpc_alloc_shared(i32 4) | // CHECK2-NEXT: [[F:%.*]] = call i8* @__kmpc_alloc_shared(i32 4) | ||||
// CHECK2-NEXT: [[F_ON_STACK:%.*]] = bitcast i8* [[F]] to i32* | // CHECK2-NEXT: [[F_ON_STACK:%.*]] = bitcast i8* [[F]] to i32* | ||||
// CHECK2-NEXT: store i32 [[F1]], i32* [[F_ON_STACK]], align 4 | // CHECK2-NEXT: store i32 [[F1]], i32* [[F_ON_STACK]], align 4 | ||||
// CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 | // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 | ||||
Show All 13 Lines | |||||
// | // | ||||
// CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z16unreachable_callv_l142 | // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z16unreachable_callv_l142 | ||||
// CHECK2-SAME: () #[[ATTR1]] { | // CHECK2-SAME: () #[[ATTR1]] { | ||||
// CHECK2-NEXT: entry: | // CHECK2-NEXT: entry: | ||||
// CHECK2-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_target_init(%struct.ident_t* @[[GLOB1]], i8 1, i1 true, i1 true) | // CHECK2-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_target_init(%struct.ident_t* @[[GLOB1]], i8 1, i1 true, i1 true) | ||||
// CHECK2-NEXT: [[EXEC_USER_CODE:%.*]] = icmp eq i32 [[TMP0]], -1 | // CHECK2-NEXT: [[EXEC_USER_CODE:%.*]] = icmp eq i32 [[TMP0]], -1 | ||||
// CHECK2-NEXT: br i1 [[EXEC_USER_CODE]], label [[USER_CODE_ENTRY:%.*]], label [[WORKER_EXIT:%.*]] | // CHECK2-NEXT: br i1 [[EXEC_USER_CODE]], label [[USER_CODE_ENTRY:%.*]], label [[WORKER_EXIT:%.*]] | ||||
// CHECK2: user_code.entry: | // CHECK2: user_code.entry: | ||||
// CHECK2-NEXT: call void @_Z6asserti(i32 0) #[[ATTR7:[0-9]+]] | // CHECK2-NEXT: call void @_Z6asserti(i32 0) #[[ATTR9:[0-9]+]] | ||||
// CHECK2-NEXT: unreachable | // CHECK2-NEXT: unreachable | ||||
// CHECK2: worker.exit: | // CHECK2: worker.exit: | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// CHECK2: 1: | // CHECK2: 1: | ||||
// CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK2-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
▲ Show 20 Lines • Show All 49 Lines • ▼ Show 20 Lines | |||||
// CHECK2-NEXT: [[TMP3:%.*]] = load double, double* [[TMP2]], align 8 | // CHECK2-NEXT: [[TMP3:%.*]] = load double, double* [[TMP2]], align 8 | ||||
// CHECK2-NEXT: [[ADD:%.*]] = fadd double 2.000000e+00, [[TMP3]] | // CHECK2-NEXT: [[ADD:%.*]] = fadd double 2.000000e+00, [[TMP3]] | ||||
// CHECK2-NEXT: [[CONV:%.*]] = fptosi double [[ADD]] to i32 | // CHECK2-NEXT: [[CONV:%.*]] = fptosi double [[ADD]] to i32 | ||||
// CHECK2-NEXT: store i32 [[CONV]], i32* [[TMP0]], align 4 | // CHECK2-NEXT: store i32 [[CONV]], i32* [[TMP0]], align 4 | ||||
// CHECK2-NEXT: ret void | // CHECK2-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK2-LABEL: define {{[^@]+}}@__omp_outlined__1_wrapper | // CHECK2-LABEL: define {{[^@]+}}@__omp_outlined__1_wrapper | ||||
// CHECK2-SAME: (i16 zeroext [[TMP0:%.*]], i32 [[TMP1:%.*]]) #[[ATTR5:[0-9]+]] { | // CHECK2-SAME: (i16 zeroext [[TMP0:%.*]], i32 [[TMP1:%.*]]) #[[ATTR7:[0-9]+]] { | ||||
// CHECK2-NEXT: entry: | // CHECK2-NEXT: entry: | ||||
// CHECK2-NEXT: [[DOTADDR:%.*]] = alloca i16, align 2 | // CHECK2-NEXT: [[DOTADDR:%.*]] = alloca i16, align 2 | ||||
// CHECK2-NEXT: [[DOTADDR1:%.*]] = alloca i32, align 4 | // CHECK2-NEXT: [[DOTADDR1:%.*]] = alloca i32, align 4 | ||||
// CHECK2-NEXT: [[DOTZERO_ADDR:%.*]] = alloca i32, align 4 | // CHECK2-NEXT: [[DOTZERO_ADDR:%.*]] = alloca i32, align 4 | ||||
// CHECK2-NEXT: [[GLOBAL_ARGS:%.*]] = alloca i8**, align 4 | // CHECK2-NEXT: [[GLOBAL_ARGS:%.*]] = alloca i8**, align 4 | ||||
// CHECK2-NEXT: store i16 [[TMP0]], i16* [[DOTADDR]], align 2 | // CHECK2-NEXT: store i16 [[TMP0]], i16* [[DOTADDR]], align 2 | ||||
// CHECK2-NEXT: store i32 [[TMP1]], i32* [[DOTADDR1]], align 4 | // CHECK2-NEXT: store i32 [[TMP1]], i32* [[DOTADDR1]], align 4 | ||||
// CHECK2-NEXT: store i32 0, i32* [[DOTZERO_ADDR]], align 4 | // CHECK2-NEXT: store i32 0, i32* [[DOTZERO_ADDR]], align 4 | ||||
Show All 25 Lines | |||||
// CHECK3-NEXT: [[TMP2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]]) | // CHECK3-NEXT: [[TMP2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]]) | ||||
// CHECK3-NEXT: [[TMP3:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 0 | // CHECK3-NEXT: [[TMP3:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 0 | ||||
// CHECK3-NEXT: [[TMP4:%.*]] = bitcast i32** [[PTR1_ADDR]] to i8* | // CHECK3-NEXT: [[TMP4:%.*]] = bitcast i32** [[PTR1_ADDR]] to i8* | ||||
// CHECK3-NEXT: store i8* [[TMP4]], i8** [[TMP3]], align 4 | // CHECK3-NEXT: store i8* [[TMP4]], i8** [[TMP3]], align 4 | ||||
// CHECK3-NEXT: [[TMP5:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 1 | // CHECK3-NEXT: [[TMP5:%.*]] = getelementptr inbounds [2 x i8*], [2 x i8*]* [[CAPTURED_VARS_ADDRS]], i32 0, i32 1 | ||||
// CHECK3-NEXT: [[TMP6:%.*]] = bitcast i32** [[TMP0]] to i8* | // CHECK3-NEXT: [[TMP6:%.*]] = bitcast i32** [[TMP0]] to i8* | ||||
// CHECK3-NEXT: store i8* [[TMP6]], i8** [[TMP5]], align 4 | // CHECK3-NEXT: store i8* [[TMP6]], i8** [[TMP5]], align 4 | ||||
// CHECK3-NEXT: [[TMP7:%.*]] = bitcast [2 x i8*]* [[CAPTURED_VARS_ADDRS]] to i8** | // CHECK3-NEXT: [[TMP7:%.*]] = bitcast [2 x i8*]* [[CAPTURED_VARS_ADDRS]] to i8** | ||||
// CHECK3-NEXT: call void @__kmpc_parallel_51(%struct.ident_t* @[[GLOB2]], i32 [[TMP2]], i32 1, i32 -1, i32 -1, i8* bitcast (void (i32*, i32*, i32**, i32**)* @__omp_outlined__ to i8*), i8* null, i8** [[TMP7]], i32 2) | // CHECK3-NEXT: call void @__kmpc_parallel_51(%struct.ident_t* @[[GLOB2]], i32 [[TMP2]], i32 1, i32 2, i32 -1, i8* bitcast (void (i32*, i32*, i32**, i32**)* @__omp_outlined__ to i8*), i8* null, i8** [[TMP7]], i32 2) | ||||
// CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 2, i1 true) | // CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 2, i1 true) | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// CHECK3: worker.exit: | // CHECK3: worker.exit: | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK3-LABEL: define {{[^@]+}}@__omp_outlined__ | // CHECK3-LABEL: define {{[^@]+}}@__omp_outlined__ | ||||
// CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR1:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR2:%.*]]) #[[ATTR1:[0-9]+]] { | // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR1:%.*]], i32** nonnull align 4 dereferenceable(4) [[PTR2:%.*]]) #[[ATTR1:[0-9]+]] { | ||||
▲ Show 20 Lines • Show All 118 Lines • ▼ Show 20 Lines | |||||
// CHECK3-NEXT: [[ADD17:%.*]] = add nsw i64 [[TMP15]], 1 | // CHECK3-NEXT: [[ADD17:%.*]] = add nsw i64 [[TMP15]], 1 | ||||
// CHECK3-NEXT: store i64 [[ADD17]], i64* [[X]], align 8 | // CHECK3-NEXT: store i64 [[ADD17]], i64* [[X]], align 8 | ||||
// CHECK3-NEXT: [[Y:%.*]] = getelementptr inbounds [[STRUCT_TT]], %struct.TT* [[TMP7]], i32 0, i32 1 | // CHECK3-NEXT: [[Y:%.*]] = getelementptr inbounds [[STRUCT_TT]], %struct.TT* [[TMP7]], i32 0, i32 1 | ||||
// CHECK3-NEXT: [[TMP16:%.*]] = load i8, i8* [[Y]], align 8 | // CHECK3-NEXT: [[TMP16:%.*]] = load i8, i8* [[Y]], align 8 | ||||
// CHECK3-NEXT: [[CONV18:%.*]] = sext i8 [[TMP16]] to i32 | // CHECK3-NEXT: [[CONV18:%.*]] = sext i8 [[TMP16]] to i32 | ||||
// CHECK3-NEXT: [[ADD19:%.*]] = add nsw i32 [[CONV18]], 1 | // CHECK3-NEXT: [[ADD19:%.*]] = add nsw i32 [[CONV18]], 1 | ||||
// CHECK3-NEXT: [[CONV20:%.*]] = trunc i32 [[ADD19]] to i8 | // CHECK3-NEXT: [[CONV20:%.*]] = trunc i32 [[ADD19]] to i8 | ||||
// CHECK3-NEXT: store i8 [[CONV20]], i8* [[Y]], align 8 | // CHECK3-NEXT: store i8 [[CONV20]], i8* [[Y]], align 8 | ||||
// CHECK3-NEXT: [[CALL:%.*]] = call nonnull align 8 dereferenceable(8) i64* @_ZN2TTIxcEixEi(%struct.TT* nonnull align 8 dereferenceable(16) [[TMP7]], i32 0) #[[ATTR6:[0-9]+]] | // CHECK3-NEXT: [[CALL:%.*]] = call nonnull align 8 dereferenceable(8) i64* @_ZN2TTIxcEixEi(%struct.TT* nonnull align 8 dereferenceable(16) [[TMP7]], i32 0) #[[ATTR8:[0-9]+]] | ||||
// CHECK3-NEXT: [[TMP17:%.*]] = load i64, i64* [[CALL]], align 8 | // CHECK3-NEXT: [[TMP17:%.*]] = load i64, i64* [[CALL]], align 8 | ||||
// CHECK3-NEXT: [[ADD21:%.*]] = add nsw i64 [[TMP17]], 1 | // CHECK3-NEXT: [[ADD21:%.*]] = add nsw i64 [[TMP17]], 1 | ||||
// CHECK3-NEXT: store i64 [[ADD21]], i64* [[CALL]], align 8 | // CHECK3-NEXT: store i64 [[ADD21]], i64* [[CALL]], align 8 | ||||
// CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// CHECK3: worker.exit: | // CHECK3: worker.exit: | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK3-LABEL: define {{[^@]+}}@_ZN2TTIxcEixEi | // CHECK3-LABEL: define {{[^@]+}}@_ZN2TTIxcEixEi | ||||
// CHECK3-SAME: (%struct.TT* nonnull align 8 dereferenceable(16) [[THIS:%.*]], i32 [[I:%.*]]) #[[ATTR3:[0-9]+]] comdat align 2 { | // CHECK3-SAME: (%struct.TT* nonnull align 8 dereferenceable(16) [[THIS:%.*]], i32 [[I:%.*]]) #[[ATTR4:[0-9]+]] comdat align 2 { | ||||
// CHECK3-NEXT: entry: | // CHECK3-NEXT: entry: | ||||
// CHECK3-NEXT: [[THIS_ADDR:%.*]] = alloca %struct.TT*, align 4 | // CHECK3-NEXT: [[THIS_ADDR:%.*]] = alloca %struct.TT*, align 4 | ||||
// CHECK3-NEXT: [[I_ADDR:%.*]] = alloca i32, align 4 | // CHECK3-NEXT: [[I_ADDR:%.*]] = alloca i32, align 4 | ||||
// CHECK3-NEXT: store %struct.TT* [[THIS]], %struct.TT** [[THIS_ADDR]], align 4 | // CHECK3-NEXT: store %struct.TT* [[THIS]], %struct.TT** [[THIS_ADDR]], align 4 | ||||
// CHECK3-NEXT: store i32 [[I]], i32* [[I_ADDR]], align 4 | // CHECK3-NEXT: store i32 [[I]], i32* [[I_ADDR]], align 4 | ||||
// CHECK3-NEXT: [[THIS1:%.*]] = load %struct.TT*, %struct.TT** [[THIS_ADDR]], align 4 | // CHECK3-NEXT: [[THIS1:%.*]] = load %struct.TT*, %struct.TT** [[THIS_ADDR]], align 4 | ||||
// CHECK3-NEXT: [[X:%.*]] = getelementptr inbounds [[STRUCT_TT:%.*]], %struct.TT* [[THIS1]], i32 0, i32 0 | // CHECK3-NEXT: [[X:%.*]] = getelementptr inbounds [[STRUCT_TT:%.*]], %struct.TT* [[THIS1]], i32 0, i32 0 | ||||
// CHECK3-NEXT: ret i64* [[X]] | // CHECK3-NEXT: ret i64* [[X]] | ||||
▲ Show 20 Lines • Show All 74 Lines • ▼ Show 20 Lines | |||||
// CHECK3-NEXT: [[TMP7:%.*]] = mul nsw i32 1, [[TMP2]] | // CHECK3-NEXT: [[TMP7:%.*]] = mul nsw i32 1, [[TMP2]] | ||||
// CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i16, i16* [[TMP3]], i32 [[TMP7]] | // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i16, i16* [[TMP3]], i32 [[TMP7]] | ||||
// CHECK3-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i16, i16* [[ARRAYIDX]], i32 1 | // CHECK3-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i16, i16* [[ARRAYIDX]], i32 1 | ||||
// CHECK3-NEXT: store i16 [[CONV4]], i16* [[ARRAYIDX5]], align 2 | // CHECK3-NEXT: store i16 [[CONV4]], i16* [[ARRAYIDX5]], align 2 | ||||
// CHECK3-NEXT: [[A6:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | // CHECK3-NEXT: [[A6:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | ||||
// CHECK3-NEXT: [[TMP8:%.*]] = load double, double* [[A6]], align 8 | // CHECK3-NEXT: [[TMP8:%.*]] = load double, double* [[A6]], align 8 | ||||
// CHECK3-NEXT: [[CONV7:%.*]] = fptosi double [[TMP8]] to i32 | // CHECK3-NEXT: [[CONV7:%.*]] = fptosi double [[TMP8]] to i32 | ||||
// CHECK3-NEXT: [[A8:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | // CHECK3-NEXT: [[A8:%.*]] = getelementptr inbounds [[STRUCT_S1]], %struct.S1* [[TMP0]], i32 0, i32 0 | ||||
// CHECK3-NEXT: [[CALL:%.*]] = call i32 @_Z3baziRd(i32 [[CONV7]], double* nonnull align 8 dereferenceable(8) [[A8]]) #[[ATTR6]] | // CHECK3-NEXT: [[CALL:%.*]] = call i32 @_Z3baziRd(i32 [[CONV7]], double* nonnull align 8 dereferenceable(8) [[A8]]) #[[ATTR8]] | ||||
// CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// CHECK3: worker.exit: | // CHECK3: worker.exit: | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK3-LABEL: define {{[^@]+}}@_Z3baziRd | // CHECK3-LABEL: define {{[^@]+}}@_Z3baziRd | ||||
// CHECK3-SAME: (i32 [[F1:%.*]], double* nonnull align 8 dereferenceable(8) [[A:%.*]]) #[[ATTR3]] { | // CHECK3-SAME: (i32 [[F1:%.*]], double* nonnull align 8 dereferenceable(8) [[A:%.*]]) #[[ATTR4]] { | ||||
// CHECK3-NEXT: entry: | // CHECK3-NEXT: entry: | ||||
// CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 | // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 | ||||
// CHECK3-NEXT: [[CAPTURED_VARS_ADDRS:%.*]] = alloca [2 x i8*], align 4 | // CHECK3-NEXT: [[CAPTURED_VARS_ADDRS:%.*]] = alloca [2 x i8*], align 4 | ||||
// CHECK3-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB3:[0-9]+]]) | // CHECK3-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB3:[0-9]+]]) | ||||
// CHECK3-NEXT: [[F:%.*]] = call i8* @__kmpc_alloc_shared(i32 4) | // CHECK3-NEXT: [[F:%.*]] = call i8* @__kmpc_alloc_shared(i32 4) | ||||
// CHECK3-NEXT: [[F_ON_STACK:%.*]] = bitcast i8* [[F]] to i32* | // CHECK3-NEXT: [[F_ON_STACK:%.*]] = bitcast i8* [[F]] to i32* | ||||
// CHECK3-NEXT: store i32 [[F1]], i32* [[F_ON_STACK]], align 4 | // CHECK3-NEXT: store i32 [[F1]], i32* [[F_ON_STACK]], align 4 | ||||
// CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 | // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 | ||||
Show All 13 Lines | |||||
// | // | ||||
// CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z16unreachable_callv_l142 | // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z16unreachable_callv_l142 | ||||
// CHECK3-SAME: () #[[ATTR1]] { | // CHECK3-SAME: () #[[ATTR1]] { | ||||
// CHECK3-NEXT: entry: | // CHECK3-NEXT: entry: | ||||
// CHECK3-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_target_init(%struct.ident_t* @[[GLOB1]], i8 1, i1 true, i1 true) | // CHECK3-NEXT: [[TMP0:%.*]] = call i32 @__kmpc_target_init(%struct.ident_t* @[[GLOB1]], i8 1, i1 true, i1 true) | ||||
// CHECK3-NEXT: [[EXEC_USER_CODE:%.*]] = icmp eq i32 [[TMP0]], -1 | // CHECK3-NEXT: [[EXEC_USER_CODE:%.*]] = icmp eq i32 [[TMP0]], -1 | ||||
// CHECK3-NEXT: br i1 [[EXEC_USER_CODE]], label [[USER_CODE_ENTRY:%.*]], label [[WORKER_EXIT:%.*]] | // CHECK3-NEXT: br i1 [[EXEC_USER_CODE]], label [[USER_CODE_ENTRY:%.*]], label [[WORKER_EXIT:%.*]] | ||||
// CHECK3: user_code.entry: | // CHECK3: user_code.entry: | ||||
// CHECK3-NEXT: call void @_Z6asserti(i32 0) #[[ATTR7:[0-9]+]] | // CHECK3-NEXT: call void @_Z6asserti(i32 0) #[[ATTR9:[0-9]+]] | ||||
// CHECK3-NEXT: unreachable | // CHECK3-NEXT: unreachable | ||||
// CHECK3: worker.exit: | // CHECK3: worker.exit: | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// CHECK3: 1: | // CHECK3: 1: | ||||
// CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | // CHECK3-NEXT: call void @__kmpc_target_deinit(%struct.ident_t* @[[GLOB1]], i8 1, i1 true) | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
▲ Show 20 Lines • Show All 49 Lines • ▼ Show 20 Lines | |||||
// CHECK3-NEXT: [[TMP3:%.*]] = load double, double* [[TMP2]], align 8 | // CHECK3-NEXT: [[TMP3:%.*]] = load double, double* [[TMP2]], align 8 | ||||
// CHECK3-NEXT: [[ADD:%.*]] = fadd double 2.000000e+00, [[TMP3]] | // CHECK3-NEXT: [[ADD:%.*]] = fadd double 2.000000e+00, [[TMP3]] | ||||
// CHECK3-NEXT: [[CONV:%.*]] = fptosi double [[ADD]] to i32 | // CHECK3-NEXT: [[CONV:%.*]] = fptosi double [[ADD]] to i32 | ||||
// CHECK3-NEXT: store i32 [[CONV]], i32* [[TMP0]], align 4 | // CHECK3-NEXT: store i32 [[CONV]], i32* [[TMP0]], align 4 | ||||
// CHECK3-NEXT: ret void | // CHECK3-NEXT: ret void | ||||
// | // | ||||
// | // | ||||
// CHECK3-LABEL: define {{[^@]+}}@__omp_outlined__1_wrapper | // CHECK3-LABEL: define {{[^@]+}}@__omp_outlined__1_wrapper | ||||
// CHECK3-SAME: (i16 zeroext [[TMP0:%.*]], i32 [[TMP1:%.*]]) #[[ATTR5:[0-9]+]] { | // CHECK3-SAME: (i16 zeroext [[TMP0:%.*]], i32 [[TMP1:%.*]]) #[[ATTR7:[0-9]+]] { | ||||
// CHECK3-NEXT: entry: | // CHECK3-NEXT: entry: | ||||
// CHECK3-NEXT: [[DOTADDR:%.*]] = alloca i16, align 2 | // CHECK3-NEXT: [[DOTADDR:%.*]] = alloca i16, align 2 | ||||
// CHECK3-NEXT: [[DOTADDR1:%.*]] = alloca i32, align 4 | // CHECK3-NEXT: [[DOTADDR1:%.*]] = alloca i32, align 4 | ||||
// CHECK3-NEXT: [[DOTZERO_ADDR:%.*]] = alloca i32, align 4 | // CHECK3-NEXT: [[DOTZERO_ADDR:%.*]] = alloca i32, align 4 | ||||
// CHECK3-NEXT: [[GLOBAL_ARGS:%.*]] = alloca i8**, align 4 | // CHECK3-NEXT: [[GLOBAL_ARGS:%.*]] = alloca i8**, align 4 | ||||
// CHECK3-NEXT: store i16 [[TMP0]], i16* [[DOTADDR]], align 2 | // CHECK3-NEXT: store i16 [[TMP0]], i16* [[DOTADDR]], align 2 | ||||
// CHECK3-NEXT: store i32 [[TMP1]], i32* [[DOTADDR1]], align 4 | // CHECK3-NEXT: store i32 [[TMP1]], i32* [[DOTADDR1]], align 4 | ||||
// CHECK3-NEXT: store i32 0, i32* [[DOTZERO_ADDR]], align 4 | // CHECK3-NEXT: store i32 0, i32* [[DOTZERO_ADDR]], align 4 | ||||
Show All 11 Lines |