diff --git a/openmp/libomptarget/src/interface.cpp b/openmp/libomptarget/src/interface.cpp --- a/openmp/libomptarget/src/interface.cpp +++ b/openmp/libomptarget/src/interface.cpp @@ -299,8 +299,12 @@ int32_t ThreadLimit, void *HostPtr, KernelArgsTy *KernelArgs) { TIMESCOPE_WITH_IDENT(Loc); - return targetKernel(Loc, DeviceId, NumTeams, ThreadLimit, - HostPtr, KernelArgs); + if (KernelArgs->Flags.NoWait) + return targetKernel( + Loc, DeviceId, NumTeams, ThreadLimit, HostPtr, KernelArgs); + else + return targetKernel(Loc, DeviceId, NumTeams, ThreadLimit, + HostPtr, KernelArgs); } /// Implements a target kernel entry that replays a pre-recorded kernel.