Unverified Commit 73b29188 authored by yiwu-arbug, committed by GitHub

Add clang-format script and CI job (#9)

Add scripts/format-diff.sh, which uses clang-format to format the code changes made since diverging from master. Also add a Travis CI job that checks whether the code needs formatting, and format all existing code.
Signed-off-by: Yi Wu <yiwu@pingcap.com>
parent 05a37557
......@@ -9,10 +9,12 @@ addons:
apt:
sources:
- ubuntu-toolchain-r-test
- llvm-toolchain-xenial-7
packages:
- g++-7
- libgflags-dev
- lcov
- clang-format-7
# For GCC build, we also report code coverage to codecov.
matrix:
......@@ -26,28 +28,31 @@ matrix:
- compiler: clang
env: SANITIZER="UBSAN"
- env: COMPILER=gcc7
- env: FORMATTER=ON
install:
- git clone --depth=1 --branch=tikv-3.0 https://github.com/pingcap/rocksdb.git
- if [ "${COMPILER}" == gcc7 ]; then
CC=gcc-7;
CXX=g++-7;
COVERAGE_OPT="-DCODE_COVERAGE=ON";
export COVERAGE_OPT="-DCODE_COVERAGE=ON";
fi
- if [ ! -z "${BUILD_TYPE}" ]; then
BUILD_OPT="-DCMAKE_BUILD_TYPE=${BUILD_TYPE}";
export BUILD_OPT="-DCMAKE_BUILD_TYPE=${BUILD_TYPE}";
else
BUILD_OPT="-DCMAKE_BUILD_TYPE=Debug";
export BUILD_OPT="-DCMAKE_BUILD_TYPE=Debug";
fi
- if [ ! -z "${SANITIZER}" ]; then
SANITIZER_OPT="-DWITH_${SANITIZER}=ON";
TOOLS_OPT="-DWITH_TITAN_TOOLS=OFF";
export SANITIZER_OPT="-DWITH_${SANITIZER}=ON";
export TOOLS_OPT="-DWITH_TITAN_TOOLS=OFF";
fi
script:
- cmake . -L -DROCKSDB_DIR=./rocksdb -DTRAVIS=ON ${BUILD_OPT} ${SANITIZER_OPT} ${TOOLS_OPT} ${COVERAGE_OPT}
- make -j4
- ctest -R titan
- if [ -z "${FORMATTER}" ]; then
bash scripts/travis-make.sh;
else
bash scripts/travis-format.sh;
fi
after_success:
- if [ "${COMPILER}" == gcc7 ]; then
......
......@@ -32,4 +32,7 @@ cmake .. -DROCKSDB_DIR=<rocksdb_source_dir> -DWITH_SNAPPY=ON
# Run tests after build. You need to filter tests by "titan" prefix.
ctest -R titan
# To format code, install clang-format and run the script.
bash scripts/format-diff.sh
```
......@@ -46,8 +46,7 @@ class TitanDB : public StackableDB {
using StackableDB::CreateColumnFamilies;
Status CreateColumnFamilies(
const ColumnFamilyOptions& options,
const std::vector<std::string>& names,
const ColumnFamilyOptions& options, const std::vector<std::string>& names,
std::vector<ColumnFamilyHandle*>* handles) override {
std::vector<TitanCFDescriptor> descs;
for (auto& name : names) {
......@@ -75,7 +74,8 @@ class TitanDB : public StackableDB {
Status DropColumnFamilies(
const std::vector<ColumnFamilyHandle*>& handles) override = 0;
Status DestroyColumnFamilyHandle(ColumnFamilyHandle* column_family) override = 0;
Status DestroyColumnFamilyHandle(ColumnFamilyHandle* column_family) override =
0;
using StackableDB::Merge;
Status Merge(const WriteOptions&, ColumnFamilyHandle*, const Slice& /*key*/,
......@@ -85,8 +85,8 @@ class TitanDB : public StackableDB {
using rocksdb::StackableDB::SingleDelete;
Status SingleDelete(const WriteOptions& /*wopts*/,
ColumnFamilyHandle* /*column_family*/,
const Slice& /*key*/) override {
ColumnFamilyHandle* /*column_family*/,
const Slice& /*key*/) override {
return Status::NotSupported("Not supported operation in titan db.");
}
......
#!/bin/bash
# Formats, in place, the lines changed since the current branch diverged from
# master (uncommitted working-tree changes included).
# Requires git and clang-format-diff on PATH.
# NOTE(review): presumably must be run from the repository root, since the
# paths in the diff are handed to clang-format-diff with -p1 -- confirm.

# Abort on the first failing command, including a failure inside the pipeline.
set -eo pipefail

# Resolve the fork point in its own statement. A command substitution embedded
# in another command's arguments has its exit status ignored, so a failed
# merge-base would otherwise degrade to a bare `git diff` and format the wrong
# set of changes.
base=$(git merge-base master HEAD)
git diff "${base}" | clang-format-diff -style=google -p1 -i
#!/bin/bash
# CI formatting check: exits non-zero when the commits on this branch (relative
# to its fork point from master) contain lines that clang-format would change.
# Writes the scratch files `diff` and `formatted` into the current directory.
set -ev
# Make a local `master` ref available so the fork point can be computed.
git fetch --depth=1 origin master:master;
# Resolve the fork point in its own statement so that `set -e` aborts the job
# when it cannot be determined. Embedded directly in the `git diff` arguments,
# a failed merge-base is ignored and the command degrades to `git diff HEAD`,
# which is empty in a clean checkout -- the check would then pass vacuously.
base=$(git merge-base master HEAD);
git diff "${base}" HEAD > diff;
# Without -i, clang-format-diff prints the reformatting it would apply;
# empty output means the changed lines are already formatted.
clang-format-diff-7 -style=google -p1 < diff > formatted;
if [ -s formatted ]; then
  cat formatted;
  echo "Run scripts/format-diff.sh to format your code.";
  exit 1;
fi;
#!/bin/bash
# CI build-and-test entry point: configure with CMake, build, then run the
# tests whose names match "titan".
# -e: stop at the first failing step; -v: echo each script line as it is read.
set -e -v

# BUILD_OPT, SANITIZER_OPT, TOOLS_OPT and COVERAGE_OPT are expected to come
# from the CI environment. They are deliberately left unquoted so that an unset
# or empty variable contributes no argument at all.
cmake . -L \
  -DROCKSDB_DIR=./rocksdb \
  -DTRAVIS=ON \
  ${BUILD_OPT} ${SANITIZER_OPT} ${TOOLS_OPT} ${COVERAGE_OPT}

make -j4

ctest -R titan
#pragma once
#include "rocksdb/listener.h"
#include "db_impl.h"
#include "rocksdb/listener.h"
namespace rocksdb {
......
#pragma once
#include "util/file_reader_writer.h"
#include "blob_format.h"
#include "titan/options.h"
#include "util/file_reader_writer.h"
namespace rocksdb {
namespace titandb {
......
#include "blob_file_cache.h"
#include "util/filename.h"
#include "util.h"
#include "util/filename.h"
namespace rocksdb {
namespace titandb {
......
#pragma once
#include "rocksdb/options.h"
#include "blob_file_reader.h"
#include "blob_format.h"
#include "rocksdb/options.h"
#include "titan/options.h"
namespace rocksdb {
......
#include "blob_file_iterator.h"
#include "util/crc32c.h"
#include "util.h"
#include "util/crc32c.h"
namespace rocksdb {
namespace titandb {
......
......@@ -3,13 +3,13 @@
#include <cstdint>
#include <queue>
#include "blob_format.h"
#include "rocksdb/slice.h"
#include "rocksdb/status.h"
#include "table/internal_iterator.h"
#include "util/file_reader_writer.h"
#include "blob_format.h"
#include "titan/options.h"
#include "util.h"
#include "util/file_reader_writer.h"
namespace rocksdb {
namespace titandb {
......
......@@ -2,11 +2,11 @@
#include <cinttypes>
#include "util/filename.h"
#include "util/testharness.h"
#include "blob_file_builder.h"
#include "blob_file_cache.h"
#include "blob_file_reader.h"
#include "util/filename.h"
#include "util/testharness.h"
namespace rocksdb {
namespace titandb {
......@@ -57,7 +57,8 @@ class BlobFileIteratorTest : public testing::Test {
{
std::unique_ptr<WritableFile> f;
ASSERT_OK(env_->NewWritableFile(file_name_, &f, env_options_));
writable_file_.reset(new WritableFileWriter(std::move(f), file_name_, env_options_));
writable_file_.reset(
new WritableFileWriter(std::move(f), file_name_, env_options_));
}
builder_.reset(new BlobFileBuilder(cf_options, writable_file_.get()));
}
......
#pragma once
#include "util/file_reader_writer.h"
#include "blob_format.h"
#include "util/file_reader_writer.h"
namespace rocksdb {
namespace titandb {
......
#pragma once
#include "util/file_reader_writer.h"
#include "blob_format.h"
#include "titan/options.h"
#include "util/file_reader_writer.h"
namespace rocksdb {
namespace titandb {
......
#pragma once
#include "db_impl.h"
#include "rocksdb/listener.h"
#include "rocksdb/table_properties.h"
#include "util/coding.h"
#include "db_impl.h"
#include "version_set.h"
namespace rocksdb {
......
......@@ -40,8 +40,8 @@ class BlobFileSizeCollectorTest : public testing::Test {
void NewFileWriter(std::unique_ptr<WritableFileWriter>* result) {
std::unique_ptr<WritableFile> writable_file;
ASSERT_OK(env_->NewWritableFile(file_name_, &writable_file, env_options_));
result->reset(
new WritableFileWriter(std::move(writable_file), file_name_, env_options_));
result->reset(new WritableFileWriter(std::move(writable_file), file_name_,
env_options_));
ASSERT_TRUE(*result);
}
......
#include "util/filename.h"
#include "util/testharness.h"
#include "blob_file_builder.h"
#include "blob_file_cache.h"
#include "blob_file_reader.h"
#include "util/filename.h"
#include "util/testharness.h"
namespace rocksdb {
namespace titandb {
......@@ -31,7 +31,8 @@ class BlobFileTest : public testing::Test {
{
std::unique_ptr<WritableFile> f;
ASSERT_OK(env_->NewWritableFile(file_name_, &f, env_options_));
file.reset(new WritableFileWriter(std::move(f), file_name_, env_options_));
file.reset(
new WritableFileWriter(std::move(f), file_name_, env_options_));
}
std::unique_ptr<BlobFileBuilder> builder(
new BlobFileBuilder(cf_options, file.get()));
......@@ -91,7 +92,8 @@ class BlobFileTest : public testing::Test {
{
std::unique_ptr<WritableFile> f;
ASSERT_OK(env_->NewWritableFile(file_name_, &f, env_options_));
file.reset(new WritableFileWriter(std::move(f), file_name_, env_options_));
file.reset(
new WritableFileWriter(std::move(f), file_name_, env_options_));
}
std::unique_ptr<BlobFileBuilder> builder(
new BlobFileBuilder(cf_options, file.get()));
......
#include "blob_format.h"
#include "util/testharness.h"
#include "testutil.h"
#include "util.h"
#include "util/testharness.h"
namespace rocksdb {
namespace titandb {
......
......@@ -12,9 +12,7 @@ BlobGC::BlobGC(std::vector<BlobFileMeta*>&& blob_files,
BlobGC::~BlobGC() {}
void BlobGC::SetColumnFamily(ColumnFamilyHandle* cfh) {
cfh_ = cfh;
}
void BlobGC::SetColumnFamily(ColumnFamilyHandle* cfh) { cfh_ = cfh; }
ColumnFamilyData* BlobGC::GetColumnFamilyData() {
auto* cfhi = reinterpret_cast<ColumnFamilyHandleImpl*>(cfh_);
......
......@@ -2,8 +2,8 @@
#include <memory>
#include "db/column_family.h"
#include "blob_format.h"
#include "db/column_family.h"
#include "titan/options.h"
namespace rocksdb {
......
#pragma once
#include "db/db_impl.h"
#include "rocksdb/status.h"
#include "blob_file_builder.h"
#include "blob_file_iterator.h"
#include "blob_file_manager.h"
#include "blob_gc.h"
#include "db/db_impl.h"
#include "rocksdb/status.h"
#include "titan/options.h"
#include "version_set.h"
......
#include "blob_gc_job.h"
#include "util/testharness.h"
#include "blob_gc_picker.h"
#include "db_impl.h"
#include "util/testharness.h"
namespace rocksdb {
namespace titandb {
......@@ -42,7 +42,9 @@ class BlobGCJobTest : public testing::Test {
~BlobGCJobTest() {}
void CheckBlobNumber(int expected) {
auto b = version_set_->GetBlobStorage(base_db_->DefaultColumnFamily()->GetID()).lock();
auto b =
version_set_->GetBlobStorage(base_db_->DefaultColumnFamily()->GetID())
.lock();
ASSERT_EQ(expected, b->files_.size());
}
......@@ -80,7 +82,7 @@ class BlobGCJobTest : public testing::Test {
}
void DestroyDB() {
Status s __attribute__((__unused__)) = db_->Close();
Status s __attribute__((__unused__)) = db_->Close();
assert(s.ok());
delete db_;
db_ = nullptr;
......@@ -121,7 +123,7 @@ class BlobGCJobTest : public testing::Test {
s = blob_gc_job.Run();
mutex_->Lock();
}
if (s.ok()) {
s = blob_gc_job.Finish();
ASSERT_OK(s);
......@@ -182,12 +184,14 @@ class BlobGCJobTest : public testing::Test {
db_->Delete(WriteOptions(), GenKey(i));
}
Flush();
auto b = version_set_->GetBlobStorage(base_db_->DefaultColumnFamily()->GetID()).lock();
auto b =
version_set_->GetBlobStorage(base_db_->DefaultColumnFamily()->GetID())
.lock();
ASSERT_EQ(b->files_.size(), 1);
auto old = b->files_.begin()->first;
// for (auto& f : b->files_) {
// f.second->marked_for_sample = false;
// }
// for (auto& f : b->files_) {
// f.second->marked_for_sample = false;
// }
std::unique_ptr<BlobFileIterator> iter;
ASSERT_OK(NewIterator(b->files_.begin()->second->file_number(),
b->files_.begin()->second->file_size(), &iter));
......@@ -198,7 +202,8 @@ class BlobGCJobTest : public testing::Test {
ASSERT_TRUE(iter->key().compare(Slice(GenKey(i))) == 0);
}
RunGC();
b = version_set_->GetBlobStorage(base_db_->DefaultColumnFamily()->GetID()).lock();
b = version_set_->GetBlobStorage(base_db_->DefaultColumnFamily()->GetID())
.lock();
ASSERT_EQ(b->files_.size(), 1);
auto new1 = b->files_.begin()->first;
ASSERT_TRUE(old != new1);
......@@ -234,14 +239,15 @@ TEST_F(BlobGCJobTest, DiscardEntry) { TestDiscardEntry(); }
TEST_F(BlobGCJobTest, RunGC) { TestRunGC(); }
// Tests blob file will be kept after GC, if it is still visible by active snapshots.
// Tests blob file will be kept after GC, if it is still visible by active
// snapshots.
TEST_F(BlobGCJobTest, PurgeBlobs) {
NewDB();
auto snap1 = db_->GetSnapshot();
for (int i = 0; i < 10; i++) {
db_->Put(WriteOptions(), GenKey(i), GenValue(i));
db_->Put(WriteOptions(), GenKey(i), GenValue(i));
}
Flush();
CheckBlobNumber(1);
......@@ -254,7 +260,7 @@ TEST_F(BlobGCJobTest, PurgeBlobs) {
Flush();
CheckBlobNumber(1);
auto snap4 = db_->GetSnapshot();
RunGC();
CheckBlobNumber(1);
......@@ -264,7 +270,7 @@ TEST_F(BlobGCJobTest, PurgeBlobs) {
Flush();
auto snap5 = db_->GetSnapshot();
CheckBlobNumber(2);
db_->ReleaseSnapshot(snap2);
RunGC();
CheckBlobNumber(2);
......@@ -280,7 +286,7 @@ TEST_F(BlobGCJobTest, PurgeBlobs) {
db_->ReleaseSnapshot(snap4);
RunGC();
CheckBlobNumber(1);
db_->ReleaseSnapshot(snap5);
RunGC();
CheckBlobNumber(1);
......
......@@ -16,7 +16,8 @@ std::unique_ptr<BlobGC> BasicBlobGCPicker::PickBlobGC(
uint64_t batch_size = 0;
// ROCKS_LOG_INFO(db_options_.info_log, "blob file num:%lu gc score:%lu",
// blob_storage->NumBlobFiles(), blob_storage->gc_score().size());
// blob_storage->NumBlobFiles(),
// blob_storage->gc_score().size());
for (auto& gc_score : blob_storage->gc_score()) {
auto blob_file = blob_storage->FindFile(gc_score.file_number).lock();
assert(blob_file);
......
......@@ -2,14 +2,14 @@
#include <memory>
#include "db/column_family.h"
#include "db/write_callback.h"
#include "rocksdb/status.h"
#include "util/filename.h"
#include "blob_file_manager.h"
#include "blob_format.h"
#include "blob_gc.h"
#include "blob_storage.h"
#include "db/column_family.h"
#include "db/write_callback.h"
#include "rocksdb/status.h"
#include "util/filename.h"
namespace rocksdb {
namespace titandb {
......
#include "blob_gc_picker.h"
#include "util/filename.h"
#include "util/testharness.h"
#include "blob_file_builder.h"
#include "blob_file_cache.h"
#include "blob_file_iterator.h"
#include "blob_file_reader.h"
#include "util/filename.h"
#include "util/testharness.h"
namespace rocksdb {
namespace titandb {
......@@ -22,8 +22,10 @@ class BlobGCPickerTest : public testing::Test {
const TitanCFOptions& titan_cf_options) {
auto blob_file_cache = std::make_shared<BlobFileCache>(
titan_db_options, titan_cf_options, NewLRUCache(128));
blob_storage_.reset(new BlobStorage(titan_db_options, titan_cf_options, blob_file_cache));
basic_blob_gc_picker_.reset(new BasicBlobGCPicker(titan_db_options, titan_cf_options));
blob_storage_.reset(
new BlobStorage(titan_db_options, titan_cf_options, blob_file_cache));
basic_blob_gc_picker_.reset(
new BasicBlobGCPicker(titan_db_options, titan_cf_options));
}
void AddBlobFile(uint64_t file_number, uint64_t file_size,
......
......@@ -37,7 +37,7 @@ std::weak_ptr<BlobFileMeta> BlobStorage::FindFile(uint64_t file_number) const {
void BlobStorage::ExportBlobFiles(
std::map<uint64_t, std::weak_ptr<BlobFileMeta>>& ret) const {
ReadLock rl(&mutex_);
for(auto& kv : files_) {
for (auto& kv : files_) {
ret.emplace(kv.first, std::weak_ptr<BlobFileMeta>(kv.second));
}
}
......@@ -47,13 +47,16 @@ void BlobStorage::AddBlobFile(std::shared_ptr<BlobFileMeta>& file) {
files_.emplace(std::make_pair(file->file_number(), file));
}
void BlobStorage::MarkFileObsolete(std::shared_ptr<BlobFileMeta> file, SequenceNumber obsolete_sequence) {
void BlobStorage::MarkFileObsolete(std::shared_ptr<BlobFileMeta> file,
SequenceNumber obsolete_sequence) {
WriteLock wl(&mutex_);
obsolete_files_.push_back(std::make_pair(file->file_number(), obsolete_sequence));
obsolete_files_.push_back(
std::make_pair(file->file_number(), obsolete_sequence));
file->FileStateTransit(BlobFileMeta::FileEvent::kDelete);
}
void BlobStorage::GetObsoleteFiles(std::vector<std::string>* obsolete_files, SequenceNumber oldest_sequence) {
void BlobStorage::GetObsoleteFiles(std::vector<std::string>* obsolete_files,
SequenceNumber oldest_sequence) {
WriteLock wl(&mutex_);
for (auto it = obsolete_files_.begin(); it != obsolete_files_.end();) {
......@@ -68,14 +71,14 @@ void BlobStorage::GetObsoleteFiles(std::vector<std::string>* obsolete_files, Seq
file_cache_->Evict(file_number);
ROCKS_LOG_INFO(db_options_.info_log,
"Obsolete blob file %" PRIu64 " (obsolete at %" PRIu64
") not visible to oldest snapshot %" PRIu64 ", delete it.",
file_number, obsolete_sequence, oldest_sequence);
"Obsolete blob file %" PRIu64 " (obsolete at %" PRIu64
") not visible to oldest snapshot %" PRIu64 ", delete it.",
file_number, obsolete_sequence, oldest_sequence);
if (obsolete_files) {
obsolete_files->emplace_back(
BlobFileName(db_options_.dirname, file_number));
BlobFileName(db_options_.dirname, file_number));
}
it = obsolete_files_.erase(it);
continue;
}
......@@ -96,8 +99,7 @@ void BlobStorage::ComputeGCScore() {
gc_score_.push_back({});
auto& gcs = gc_score_.back();
gcs.file_number = file.first;
if (file.second->file_size() <
cf_options_.merge_small_file_threshold) {
if (file.second->file_size() < cf_options_.merge_small_file_threshold) {
gcs.score = 1;
} else {
gcs.score = file.second->GetDiscardableRatio();
......@@ -111,6 +113,5 @@ void BlobStorage::ComputeGCScore() {
});
}
} // namespace titandb
} // namespace rocksdb
......@@ -2,10 +2,10 @@
#include <inttypes.h>
#include "rocksdb/options.h"
#include "blob_file_cache.h"
#include "blob_format.h"
#include "blob_gc.h"
#include "rocksdb/options.h"
namespace rocksdb {
namespace titandb {
......@@ -21,12 +21,16 @@ class BlobStorage {
this->cf_options_ = bs.cf_options_;
}
BlobStorage(const TitanDBOptions& _db_options, const TitanCFOptions& _cf_options,
BlobStorage(const TitanDBOptions& _db_options,
const TitanCFOptions& _cf_options,
std::shared_ptr<BlobFileCache> _file_cache)
: db_options_(_db_options), cf_options_(_cf_options), file_cache_(_file_cache), destroyed_(false) {}
: db_options_(_db_options),
cf_options_(_cf_options),
file_cache_(_file_cache),
destroyed_(false) {}
~BlobStorage() {
for (auto& file: files_) {
for (auto& file : files_) {
file_cache_->Evict(file.second->file_number());
}
}
......@@ -45,11 +49,11 @@ class BlobStorage {
// corruption if the file doesn't exist in the specific version.
std::weak_ptr<BlobFileMeta> FindFile(uint64_t file_number) const;
std::size_t NumBlobFiles() const {
std::size_t NumBlobFiles() const {
ReadLock rl(&mutex_);
return files_.size();
return files_.size();
}
void ExportBlobFiles(
std::map<uint64_t, std::weak_ptr<BlobFileMeta>>& ret) const;
......@@ -78,9 +82,11 @@ class BlobStorage {
void AddBlobFile(std::shared_ptr<BlobFileMeta>& file);
void GetObsoleteFiles(std::vector<std::string>* obsolete_files, SequenceNumber oldest_sequence);
void GetObsoleteFiles(std::vector<std::string>* obsolete_files,
SequenceNumber oldest_sequence);
void MarkFileObsolete(std::shared_ptr<BlobFileMeta> file, SequenceNumber obsolete_sequence);
void MarkFileObsolete(std::shared_ptr<BlobFileMeta> file,
SequenceNumber obsolete_sequence);
private:
friend class VersionSet;
......@@ -92,7 +98,7 @@ class BlobStorage {
TitanDBOptions db_options_;
TitanCFOptions cf_options_;
// Read Write Mutex, which protects the `files_` structures
// Read Write Mutex, which protects the `files_` structures
mutable port::RWMutex mutex_;
// Only BlobStorage OWNS BlobFileMeta
......@@ -103,7 +109,8 @@ class BlobStorage {
std::list<std::pair<uint64_t, SequenceNumber>> obsolete_files_;
// It is marked when the column family handle is destroyed, indicating the
// in-memory data structure can be destroyed. Physical files may still be kept.
// in-memory data structure can be destroyed. Physical files may still be
// kept.
bool destroyed_;
};
......
......@@ -125,7 +125,7 @@ TitanDBImpl::TitanDBImpl(const TitanDBOptions& options,
TitanDBImpl::~TitanDBImpl() { Close(); }
// How often, in seconds, the deletion of obsolete files is scheduled.
static constexpr uint32_t kDeleteObsoleteFilesPeriodSecs = 10; // 10s
static constexpr uint32_t kDeleteObsoleteFilesPeriodSecs = 10; // 10s
void TitanDBImpl::StartBackgroundTasks() {
if (!thread_purge_obsolete_) {
......@@ -287,7 +287,7 @@ Status TitanDBImpl::CreateColumnFamilies(
Status TitanDBImpl::DropColumnFamilies(
const std::vector<ColumnFamilyHandle*>& handles) {
std::vector<uint32_t> column_families;
for (auto& handle: handles) {
for (auto& handle : handles) {
column_families.emplace_back(handle->GetID());
}
Status s = db_impl_->DropColumnFamilies(handles);
......@@ -299,7 +299,8 @@ Status TitanDBImpl::DropColumnFamilies(
return s;
}
Status TitanDBImpl::DestroyColumnFamilyHandle(ColumnFamilyHandle* column_family) {
Status TitanDBImpl::DestroyColumnFamilyHandle(
ColumnFamilyHandle* column_family) {
auto cf_id = column_family->GetID();
Status s = db_impl_->DestroyColumnFamilyHandle(column_family);
......@@ -365,7 +366,8 @@ Status TitanDBImpl::GetImpl(const ReadOptions& options,
s = storage->Get(options, index, &record, &buffer);
if (s.IsCorruption()) {
ROCKS_LOG_DEBUG(db_options_.info_log, "Key:%s Snapshot:%" PRIu64 " GetBlobFile err:%s\n",
ROCKS_LOG_DEBUG(db_options_.info_log,
"Key:%s Snapshot:%" PRIu64 " GetBlobFile err:%s\n",
key.ToString(true).c_str(),
options.snapshot->GetSequenceNumber(),
s.ToString().c_str());
......@@ -426,14 +428,14 @@ Iterator* TitanDBImpl::NewIteratorImpl(
const ReadOptions& options, ColumnFamilyHandle* handle,
std::shared_ptr<ManagedSnapshot> snapshot) {
auto cfd = reinterpret_cast<ColumnFamilyHandleImpl*>(handle)->cfd();
mutex_.Lock();
auto storage = vset_->GetBlobStorage(handle->GetID());
mutex_.Unlock();
std::unique_ptr<ArenaWrappedDBIter> iter(db_impl_->NewIteratorImpl(
options, cfd, options.snapshot->GetSequenceNumber(), nullptr /*read_callback*/,
true /*allow_blob*/, true /*allow_refresh*/));
options, cfd, options.snapshot->GetSequenceNumber(),
nullptr /*read_callback*/, true /*allow_blob*/, true /*allow_refresh*/));
return new TitanDBIterator(options, storage.lock().get(), snapshot,
std::move(iter));
}
......@@ -456,12 +458,10 @@ Status TitanDBImpl::NewIterators(
return Status::OK();
}
const Snapshot* TitanDBImpl::GetSnapshot() {
return db_->GetSnapshot();
}
const Snapshot* TitanDBImpl::GetSnapshot() { return db_->GetSnapshot(); }
void TitanDBImpl::ReleaseSnapshot(const Snapshot* snapshot) {
// TODO:
// TODO:
// We can record here whether the oldest snapshot is released.
// If not, we can just skip the next round of purging obsolete files.
db_->ReleaseSnapshot(snapshot);
......
#pragma once
#include "blob_file_manager.h"
#include "db/db_impl.h"
#include "util/repeatable_thread.h"
#include "titan/db.h"
#include "blob_file_manager.h"
#include "util/repeatable_thread.h"
#include "version_set.h"
namespace rocksdb {
......@@ -71,6 +71,7 @@ class TitanDBImpl : public TitanDB {
void OnCompactionCompleted(const CompactionJobInfo& compaction_job_info);
void StartBackgroundTasks();
private:
class FileManager;
friend class FileManager;
......
......@@ -21,7 +21,7 @@ void TitanDBImpl::PurgeObsoleteFiles() {
for (const auto& candidate_file : candidate_files) {
ROCKS_LOG_INFO(db_options_.info_log, "Titan deleting obsolete file [%s]",
candidate_file.c_str());
candidate_file.c_str());
s = env_->DeleteFile(candidate_file);
if (!s.ok()) {
fprintf(stderr, "Titan deleting file [%s] failed, status:%s",
......
......@@ -25,7 +25,7 @@ class TitanDBIterator : public Iterator {
Status status() const override {
// assume volatile inner iter
if(status_.ok()) {
if (status_.ok()) {
return iter_->status();
} else {
return status_;
......
#pragma once
#include "table/table_builder.h"
#include "blob_file_builder.h"
#include "blob_file_manager.h"
#include "table/table_builder.h"
#include "titan/options.h"
namespace rocksdb {
......
#include "table/table_builder.h"
#include "table/table_reader.h"
#include "util/filename.h"
#include "util/testharness.h"
#include "blob_file_manager.h"
#include "blob_file_reader.h"
#include "table/table_reader.h"
#include "table_factory.h"
#include "util/filename.h"
#include "util/testharness.h"
namespace rocksdb {
namespace titandb {
......@@ -80,7 +80,8 @@ class TableBuilderTest : public testing::Test {
db_options_.dirname = tmpdir_;
cf_options_.min_blob_size = kMinBlobSize;
blob_manager_.reset(new FileManager(db_options_));
table_factory_.reset(new TitanTableFactory(db_options_, cf_options_, blob_manager_));
table_factory_.reset(
new TitanTableFactory(db_options_, cf_options_, blob_manager_));
}
~TableBuilderTest() {
......
#pragma once
#include "rocksdb/table.h"
#include "blob_file_manager.h"
#include "rocksdb/table.h"
#include "titan/options.h"
namespace rocksdb {
......
This diff is collapsed.
......@@ -14,27 +14,23 @@ class TitanTestRandomAccessFile : public RandomAccessFile {
public:
explicit TitanTestRandomAccessFile(std::unique_ptr<RandomAccessFile>&& f,
TitanFaultInjectionTestEnv* env)
: target_(std::move(f)),
env_(env) {
: target_(std::move(f)), env_(env) {
assert(target_ != nullptr);
}
virtual ~TitanTestRandomAccessFile() { }
virtual ~TitanTestRandomAccessFile() {}
Status Read(uint64_t offset, size_t n, Slice* result,
char* scratch) const override;
Status Prefetch(uint64_t offset, size_t n) override;
size_t GetUniqueId(char* id, size_t max_size) const override {
return target_->GetUniqueId(id, max_size);
}
void Hint(AccessPattern pattern) override {
return target_->Hint(pattern);
}
bool use_direct_io() const override {
return target_->use_direct_io();
}
void Hint(AccessPattern pattern) override { return target_->Hint(pattern); }
bool use_direct_io() const override { return target_->use_direct_io(); }
size_t GetRequiredBufferAlignment() const override {
return target_->GetRequiredBufferAlignment();
}
Status InvalidateCache(size_t offset, size_t length) override;
private:
std::unique_ptr<RandomAccessFile> target_;
TitanFaultInjectionTestEnv* env_;
......@@ -42,9 +38,8 @@ class TitanTestRandomAccessFile : public RandomAccessFile {
class TitanFaultInjectionTestEnv : public FaultInjectionTestEnv {
public:
TitanFaultInjectionTestEnv(Env* t)
: FaultInjectionTestEnv(t) { }
virtual ~TitanFaultInjectionTestEnv() { }
TitanFaultInjectionTestEnv(Env* t) : FaultInjectionTestEnv(t) {}
virtual ~TitanFaultInjectionTestEnv() {}
Status NewRandomAccessFile(const std::string& fname,
std::unique_ptr<RandomAccessFile>* result,
const EnvOptions& soptions) {
......@@ -59,27 +54,28 @@ class TitanFaultInjectionTestEnv : public FaultInjectionTestEnv {
}
};
Status TitanTestRandomAccessFile::Read(uint64_t offset, size_t n,
Slice* result, char* scratch) const {
if(!env_->IsFilesystemActive()) {
Status TitanTestRandomAccessFile::Read(uint64_t offset, size_t n, Slice* result,
char* scratch) const {
if (!env_->IsFilesystemActive()) {
return env_->GetError();
}
return target_->Read(offset, n, result, scratch);
}
Status TitanTestRandomAccessFile::Prefetch(uint64_t offset, size_t n) {
if(!env_->IsFilesystemActive()) {
if (!env_->IsFilesystemActive()) {
return env_->GetError();
}
return target_->Prefetch(offset, n);
}
Status TitanTestRandomAccessFile::InvalidateCache(size_t offset, size_t length) {
if(!env_->IsFilesystemActive()) {
Status TitanTestRandomAccessFile::InvalidateCache(size_t offset,
size_t length) {
if (!env_->IsFilesystemActive()) {
return env_->GetError();
}
return target_->InvalidateCache(offset, length);
}
} // namespace titandb
} // namespace rocksdb
\ No newline at end of file
} // namespace titandb
} // namespace rocksdb
\ No newline at end of file
......@@ -2,8 +2,8 @@
#include <set>
#include "rocksdb/slice.h"
#include "blob_format.h"
#include "rocksdb/slice.h"
namespace rocksdb {
namespace titandb {
......@@ -21,7 +21,8 @@ class VersionEdit {
added_files_.push_back(file);
}
void DeleteBlobFile(uint64_t file_number, SequenceNumber obsolete_sequence = 0) {
void DeleteBlobFile(uint64_t file_number,
SequenceNumber obsolete_sequence = 0) {
deleted_files_.emplace_back(std::make_pair(file_number, obsolete_sequence));
}
......
......@@ -210,10 +210,10 @@ Status VersionSet::Apply(VersionEdit* edit) {
auto cf_id = edit->column_family_id_;
auto it = column_families_.find(cf_id);
if (it == column_families_.end()) {
// TODO: support OpenForReadOnly which doesn't open DB with all column family
// so there are maybe some invalid column family, but we can't just skip it
// otherwise blob files of the non-open column families will be regarded as
// obsolete and deleted.
// TODO: support OpenForReadOnly which doesn't open DB with all column
// family so there are maybe some invalid column family, but we can't just
// skip it otherwise blob files of the non-open column families will be
// regarded as obsolete and deleted.
return Status::OK();
}
auto& files = it->second->files_;
......@@ -225,7 +225,8 @@ Status VersionSet::Apply(VersionEdit* edit) {
fprintf(stderr, "blob file %" PRIu64 " doesn't exist before\n", number);
abort();
} else if (blob_it->second->is_obsolete()) {
fprintf(stderr, "blob file %" PRIu64 " has been deleted before\n", number);
fprintf(stderr, "blob file %" PRIu64 " has been deleted before\n",
number);
abort();
}
it->second->MarkFileObsolete(blob_it->second, file.second);
......@@ -236,9 +237,11 @@ Status VersionSet::Apply(VersionEdit* edit) {
auto blob_it = files.find(number);
if (blob_it != files.end()) {
if (blob_it->second->is_obsolete()) {
fprintf(stderr, "blob file %" PRIu64 " has been deleted before\n", number);
fprintf(stderr, "blob file %" PRIu64 " has been deleted before\n",
number);
} else {
fprintf(stderr, "blob file %" PRIu64 " has been added before\n", number);
fprintf(stderr, "blob file %" PRIu64 " has been added before\n",
number);
}
abort();
}
......@@ -249,37 +252,41 @@ Status VersionSet::Apply(VersionEdit* edit) {
return Status::OK();
}
void VersionSet::AddColumnFamilies(const std::map<uint32_t, TitanCFOptions>& column_families) {
void VersionSet::AddColumnFamilies(
const std::map<uint32_t, TitanCFOptions>& column_families) {
for (auto& cf : column_families) {
auto file_cache =
std::make_shared<BlobFileCache>(db_options_, cf.second, file_cache_);
auto blob_storage = std::make_shared<BlobStorage>(db_options_, cf.second, file_cache);
auto blob_storage =
std::make_shared<BlobStorage>(db_options_, cf.second, file_cache);
column_families_.emplace(cf.first, blob_storage);
}
}
Status VersionSet::DropColumnFamilies(const std::vector<uint32_t>& column_families, SequenceNumber obsolete_sequence) {
Status VersionSet::DropColumnFamilies(
const std::vector<uint32_t>& column_families,
SequenceNumber obsolete_sequence) {
Status s;
for (auto& cf_id : column_families) {
auto it = column_families_.find(cf_id);
if (it != column_families_.end()) {
VersionEdit edit;
edit.SetColumnFamilyID(it->first);
for (auto& file: it->second->files_) {
for (auto& file : it->second->files_) {
ROCKS_LOG_INFO(db_options_.info_log, "Titan add obsolete file [%llu]",
file.second->file_number());
file.second->file_number());
edit.DeleteBlobFile(file.first, obsolete_sequence);
}
s = LogAndApply(&edit);
if (!s.ok()) return s;
} else {
ROCKS_LOG_ERROR(db_options_.info_log,
"column %u not found for drop\n", cf_id);
ROCKS_LOG_ERROR(db_options_.info_log, "column %u not found for drop\n",
cf_id);
return Status::NotFound("invalid column family");
}
obsolete_columns_.insert(cf_id);
}
return s;
}
return s;
}
Status VersionSet::DestroyColumnFamily(uint32_t cf_id) {
......@@ -292,25 +299,27 @@ Status VersionSet::DestroyColumnFamily(uint32_t cf_id) {
}
return Status::OK();
}
ROCKS_LOG_ERROR(db_options_.info_log,
"column %u not found for destroy\n", cf_id);
ROCKS_LOG_ERROR(db_options_.info_log, "column %u not found for destroy\n",
cf_id);
return Status::NotFound("invalid column family");
}
void VersionSet::GetObsoleteFiles(std::vector<std::string>* obsolete_files, SequenceNumber oldest_sequence) {
void VersionSet::GetObsoleteFiles(std::vector<std::string>* obsolete_files,
SequenceNumber oldest_sequence) {
for (auto it = column_families_.begin(); it != column_families_.end();) {
auto& cf_id = it->first;
auto& blob_storage = it->second;
// In the case of dropping column family, obsolete blob files can be deleted only
// after the column family handle is destroyed.
// In the case of dropping column family, obsolete blob files can be deleted
// only after the column family handle is destroyed.
if (obsolete_columns_.find(cf_id) != obsolete_columns_.end()) {
++it;
continue;
}
blob_storage->GetObsoleteFiles(obsolete_files, oldest_sequence);
// Cleanup obsolete column family when all the blob files for that are deleted.
// Cleanup obsolete column family when all the blob files for that are
// deleted.
if (blob_storage->MaybeRemove()) {
it = column_families_.erase(it);
continue;
......@@ -318,7 +327,8 @@ void VersionSet::GetObsoleteFiles(std::vector<std::string>* obsolete_files, Sequ
++it;
}
obsolete_files->insert(obsolete_files->end(), obsolete_manifests_.begin(), obsolete_manifests_.end());
obsolete_files->insert(obsolete_files->end(), obsolete_manifests_.begin(),
obsolete_manifests_.end());
obsolete_manifests_.clear();
}
......
......@@ -5,16 +5,16 @@
#include <unordered_map>
#include <unordered_set>
#include "blob_file_cache.h"
#include "blob_storage.h"
#include "db/log_reader.h"
#include "db/log_writer.h"
#include "port/port_posix.h"
#include "rocksdb/options.h"
#include "rocksdb/status.h"
#include "util/mutexlock.h"
#include "blob_file_cache.h"
#include "titan/options.h"
#include "util/mutexlock.h"
#include "version_edit.h"
#include "blob_storage.h"
namespace rocksdb {
namespace titandb {
......@@ -43,7 +43,8 @@ class VersionSet {
// Drops some column families. The obsolete files will be deleted in
// background when they will not be accessed anymore.
// REQUIRES: mutex is held
Status DropColumnFamilies(const std::vector<uint32_t>& handles, SequenceNumber obsolete_sequence);
Status DropColumnFamilies(const std::vector<uint32_t>& handles,
SequenceNumber obsolete_sequence);
// Destroy the column family. Only after this is called, the obsolete files
// of the dropped column family can be physical deleted.
......@@ -63,7 +64,8 @@ class VersionSet {
}
// REQUIRES: mutex is held
void GetObsoleteFiles(std::vector<std::string>* obsolete_files, SequenceNumber oldest_sequence);
void GetObsoleteFiles(std::vector<std::string>* obsolete_files,
SequenceNumber oldest_sequence);
// REQUIRES: mutex is held
void MarkAllFilesForGC() {
......@@ -71,6 +73,7 @@ class VersionSet {
cf.second->MarkAllFilesForGC();
}
}
private:
friend class BlobFileSizeCollectorTest;
friend class VersionTest;
......@@ -80,7 +83,7 @@ class VersionSet {
Status OpenManifest(uint64_t number);
Status WriteSnapshot(log::Writer* log);
Status Apply(VersionEdit* edit);
std::string dirname_;
......@@ -91,10 +94,12 @@ class VersionSet {
std::vector<std::string> obsolete_manifests_;
// As rocksdb described, `DropColumnFamilies()` only records the drop of the column family specified by ColumnFamilyHandle.
// The actual data is not deleted until the client calls `delete column_family`, namely `DestroyColumnFamilyHandle()`.
// We can still continue using the column family if we have outstanding ColumnFamilyHandle pointer.
// So here record the dropped column family but the handler is not destroyed.
// As rocksdb described, `DropColumnFamilies()` only records the drop of the
// column family specified by ColumnFamilyHandle. The actual data is not
// deleted until the client calls `delete column_family`, namely
// `DestroyColumnFamilyHandle()`. We can still continue using the column
// family if we have outstanding ColumnFamilyHandle pointer. So here record
// the dropped column family but the handler is not destroyed.
std::unordered_set<uint32_t> obsolete_columns_;
std::unordered_map<uint32_t, std::shared_ptr<BlobStorage>> column_families_;
......
#include "util/filename.h"
#include "util/testharness.h"
#include "testutil.h"
#include "util.h"
#include "util/filename.h"
#include "util/testharness.h"
#include "version_edit.h"
#include "version_set.h"
......@@ -82,7 +82,7 @@ class VersionTest : public testing::Test {
auto& storage = column_families_[it.first];
// ignore obsolete file
auto size = 0;
for (auto& file: it.second->files_) {
for (auto& file : it.second->files_) {
if (!file.second->is_obsolete()) {
size++;
}
......@@ -198,7 +198,7 @@ TEST_F(VersionTest, ObsoleteFiles) {
std::vector<uint32_t> cfs = {1};
ASSERT_OK(vset_->DropColumnFamilies(cfs, 0));
vset_->GetObsoleteFiles(&of, kMaxSequenceNumber);
ASSERT_EQ(of.size(), 1);
ASSERT_EQ(of.size(), 1);
CheckColumnFamiliesSize(10);
ASSERT_OK(vset_->DestroyColumnFamily(1));
......
This diff is collapsed.
This diff is collapsed.
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment