This is an archive of the discontinued LLVM Phabricator instance.

[XRay][compiler-rt] Use sanitizer_common's atomic ops
ClosedPublic

Authored by dberris on Mar 26 2017, 10:03 PM.

Details

Reviewers
dblaikie
pelikan
Summary

Instead of the std::atomic APIs for atomic operations, we use the APIs
included with sanitizer_common. This means that, at runtime, we do not
have to depend on potentially dynamically provided implementations of
these atomic operations.

Currently we only do this for x86_64.

Fixes http://llvm.org/PR32274.

Event Timeline

dberris created this revision.Mar 26 2017, 10:03 PM
dberris updated this revision to Diff 93098.Mar 26 2017, 10:11 PM
dberris retitled this revision from split to [XRay][compiler-rt] Use sanitizer_common's atomic ops.
dberris edited the summary of this revision. (Show Details)

Retitle.

pelikan edited edge metadata.Mar 26 2017, 11:48 PM

Overall, I like it. Except for burning CPU while waiting on someone else's write(2) to (potentially) spinning rust.

lib/xray/xray_buffer_queue.h
44

This lock is being held over all Buffers (which may not be that bad actually). It is also held during the only use of apply(), which calls retryingWriteAll() and therefore will take a lot of time, including passively waiting on system calls. It would therefore make sense to use the blocking mutex here, to avoid burning CPU for potentially milliseconds.

Is there any downside to a blocking lock in this scenario? The other ones look fine as the locks only protect very small regions of memory.

dberris updated this revision to Diff 93099.Mar 27 2017, 12:16 AM
dberris marked an inline comment as done.
  • fixup: use a blocking mutex in the buffer queue
lib/xray/xray_buffer_queue.h
44

For the usage patterns we have, this should not be much of a problem. Let me explain why:

  • We expect getting and returning buffers to happen more frequently than calls to apply(...), and those operations should be fairly quick.
  • The caller of apply(...) is usually a thread that has already ensured that all threads that want to write into the buffers have returned them. While this is an implementation detail at a higher level (in the FDR logging implementation), we can more or less rely on it here.

In the review thread for the original change, we decided not to hand-write our own spinlock, though a spinlock is the better fit for the get and release cases. I'm fine using an explicitly blocking mutex here, but that trades the chance of some threads spinning for a while (fairly low, given the way we use this data structure) against the potential of blocking threads when we're in FDR mode.

It's easy enough to switch anyway, so I've changed it to use a blocking mutex.

pelikan accepted this revision.Mar 27 2017, 12:21 AM
This revision is now accepted and ready to land.Mar 27 2017, 12:21 AM
dberris closed this revision.Mar 27 2017, 12:45 AM

Submitted as rL298833.