Diff 178449

clangd/index/BackgroundIndexStorage.cpp

//== BackgroundIndexStorage.cpp - Provide caching support to BackgroundIndex ==/		//== BackgroundIndexStorage.cpp - Provide caching support to BackgroundIndex ==/
//		//
// The LLVM Compiler Infrastructure		// The LLVM Compiler Infrastructure
//		//
// This file is distributed under the University of Illinois Open Source		// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.		// License. See LICENSE.TXT for details.
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "Logger.h"		#include "Logger.h"
#include "index/Background.h"		#include "index/Background.h"
		#include "llvm/ADT/ScopeExit.h"
		#include "llvm/Support/Error.h"
#include "llvm/Support/FileSystem.h"		#include "llvm/Support/FileSystem.h"
#include "llvm/Support/MemoryBuffer.h"		#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/Path.h"		#include "llvm/Support/Path.h"
#include "llvm/Support/SHA1.h"		#include "llvm/Support/SHA1.h"

namespace clang {		namespace clang {
namespace clangd {		namespace clangd {
namespace {		namespace {

using FileDigest = decltype(llvm::SHA1::hash({}));		using FileDigest = decltype(llvm::SHA1::hash({}));

static FileDigest digest(StringRef Content) {		static FileDigest digest(StringRef Content) {
return llvm::SHA1::hash({(const uint8_t *)Content.data(), Content.size()});		return llvm::SHA1::hash({(const uint8_t *)Content.data(), Content.size()});
}		}

std::string getShardPathFromFilePath(llvm::StringRef ShardRoot,		std::string getShardPathFromFilePath(llvm::StringRef ShardRoot,
llvm::StringRef FilePath) {		llvm::StringRef FilePath) {
llvm::SmallString<128> ShardRootSS(ShardRoot);		llvm::SmallString<128> ShardRootSS(ShardRoot);
llvm::sys::path::append(ShardRootSS, llvm::sys::path::filename(FilePath) +		llvm::sys::path::append(ShardRootSS, llvm::sys::path::filename(FilePath) +
"." + llvm::toHex(digest(FilePath)) +		"." + llvm::toHex(digest(FilePath)) +
".idx");		".idx");
return ShardRootSS.str();		return ShardRootSS.str();
}		}

		llvm::Error
		writeAtomically(llvm::StringRef OutPath,
		ilya-biryukovUnsubmitted Done Reply Inline Actions NIT: use `llvm::function_ref` here. It forces you to clearly state the signature of the function and avoids the need for templates. ilya-biryukov: NIT: use `llvm::function_ref` here. It forces you to clearly state the signature of the function…
		llvm::function_ref<void(llvm::raw_ostream &)> Writer) {
		// Write to a temporary file first.
		llvm::SmallString<128> TempPath;
		ilya-biryukovUnsubmitted Done Reply Inline Actions There's a helper in LLVM that will do this, `llvm::createUniqueFile()`, I believe it also tries multiple times in case of clashes. ilya-biryukov: There's a helper in LLVM that will do this, `llvm::createUniqueFile()`, I believe it also tries…
		int FD;
		auto EC =
		ilya-biryukovUnsubmitted Done Reply Inline Actions NIT: I believe there's an overloaded `operator +(StringRef, const char*)` that would produce a Twine, so maybe simplify to `OutPath + ".tmp.%%%%%"`? Just a suggestion, up to you. ilya-biryukov: NIT: I believe there's an overloaded `operator +(StringRef, const char*)` that would produce a…
		llvm::sys::fs::createUniqueFile(OutPath + ".tmp.%%%%%%%%", FD, TempPath);
		if (EC)
		return llvm::errorCodeToError(EC);
		// Make sure temp file is destroyed on failure.
		auto RemoveOnFail =
		llvm::make_scope_exit([TempPath] { llvm::sys::fs::remove(TempPath); });
		llvm::raw_fd_ostream OS(FD, /*shouldClose=*/true);
		Writer(OS);
		OS.close();
		if (OS.has_error())
		return llvm::errorCodeToError(OS.error());
		ilya-biryukovUnsubmitted Done Reply Inline Actions We should not remove if no error occurred, as the same name at this point can be taken by a different action. ilya-biryukov: We should not remove if no error occurred, as the same name at this point can be taken by a…
		// Then move to real location.
		EC = llvm::sys::fs::rename(TempPath, OutPath);
		if (EC)
		return llvm::errorCodeToError(EC);
		// If everything went well, we already moved the file to another name. So
		ilya-biryukovUnsubmitted Done Reply Inline Actions NIT: `s/it/the name/` ilya-biryukov: NIT: `s/it/the name/`
		// don't delete the file, as the name might be taken by another file.
		RemoveOnFail.release();
		return llvm::ErrorSuccess();
		}

// Uses disk as a storage for index shards. Creates a directory called		// Uses disk as a storage for index shards. Creates a directory called
// ".clangd-index/" under the path provided during construction.		// ".clangd-index/" under the path provided during construction.
class DiskBackedIndexStorage : public BackgroundIndexStorage {		class DiskBackedIndexStorage : public BackgroundIndexStorage {
std::string DiskShardRoot;		std::string DiskShardRoot;

public:		public:
// Sets DiskShardRoot to (Directory + ".clangd-index/") which is the base		// Sets DiskShardRoot to (Directory + ".clangd-index/") which is the base
// directory for all shard files.		// directory for all shard files.
Show All 21 Lines	loadShard(llvm::StringRef ShardIdentifier) const override {
else		else
elog("Error while reading shard {0}: {1}", ShardIdentifier,		elog("Error while reading shard {0}: {1}", ShardIdentifier,
I.takeError());		I.takeError());
return nullptr;		return nullptr;
}		}

llvm::Error storeShard(llvm::StringRef ShardIdentifier,		llvm::Error storeShard(llvm::StringRef ShardIdentifier,
IndexFileOut Shard) const override {		IndexFileOut Shard) const override {
auto ShardPath = getShardPathFromFilePath(DiskShardRoot, ShardIdentifier);		return writeAtomically(
		ilya-biryukovUnsubmitted Done Reply Inline Actions Maybe extract this into a helper function? Something like std::error_code writeAtomically(StringRef OutPath, function_ref<void(raw_ostream&)> Writer) { /// create temp file, open output stream. Writer(OS): /// Move the temp file into OutPath. } This would keep the `storeShard` function as readable as it is now ilya-biryukov: Maybe extract this into a helper function? Something like ``` std::error_code writeAtomically…
std::error_code EC;		getShardPathFromFilePath(DiskShardRoot, ShardIdentifier),
llvm::raw_fd_ostream OS(ShardPath, EC);		[&Shard](llvm::raw_ostream &OS) { OS << Shard; });
		ilya-biryukovUnsubmitted Done Reply Inline Actions Maybe create these temporary files in the same dir? That would ensure the move operations do not require transferring data between physical devices. If the output file is `/some/path/foo.bar`, we could create files named `/some/path/foo.bar.tmp#####` ilya-biryukov: Maybe create these temporary files in the same dir? That would ensure the move operations do…
if (EC)
return llvm::errorCodeToError(EC);
OS << Shard;
OS.close();
return llvm::errorCodeToError(OS.error());
}		}
};		};

// Doesn't persist index shards anywhere (used when the CDB dir is unknown).		// Doesn't persist index shards anywhere (used when the CDB dir is unknown).
// We could consider indexing into ~/.clangd/ or so instead.		// We could consider indexing into ~/.clangd/ or so instead.
class NullStorage : public BackgroundIndexStorage {		class NullStorage : public BackgroundIndexStorage {
public:		public:
std::unique_ptr<IndexFileIn>		std::unique_ptr<IndexFileIn>
▲ Show 20 Lines • Show All 50 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[clangd] Change disk-backed storage to be atomic
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 178449

clangd/index/BackgroundIndexStorage.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[clangd] Change disk-backed storage to be atomic
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 178449

clangd/index/BackgroundIndexStorage.cpp

[clangd] Change disk-backed storage to be atomic
ClosedPublic