2019-09-07 10:03:22 +00:00
|
|
|
/*
|
|
|
|
This file is part of TON Blockchain Library.
|
|
|
|
|
|
|
|
TON Blockchain Library is free software: you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU Lesser General Public License as published by
|
|
|
|
the Free Software Foundation, either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
TON Blockchain Library is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU Lesser General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU Lesser General Public License
|
|
|
|
along with TON Blockchain Library. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
2020-03-23 23:32:16 +00:00
|
|
|
Copyright 2017-2020 Telegram Systems LLP
|
2019-09-07 10:03:22 +00:00
|
|
|
*/
|
|
|
|
#include "td/db/RocksDb.h"
|
|
|
|
|
|
|
|
#include "rocksdb/db.h"
|
2019-12-12 15:16:25 +00:00
|
|
|
#include "rocksdb/table.h"
|
2019-09-07 10:03:22 +00:00
|
|
|
#include "rocksdb/statistics.h"
|
|
|
|
#include "rocksdb/write_batch.h"
|
|
|
|
#include "rocksdb/utilities/optimistic_transaction_db.h"
|
|
|
|
#include "rocksdb/utilities/transaction.h"
|
|
|
|
|
|
|
|
namespace td {
|
|
|
|
namespace {
|
|
|
|
// Translates a RocksDB status into a td::Status. A successful status maps to
// Status::OK(); any other status becomes an error carrying the text returned
// by rocksdb::Status::ToString().
static Status from_rocksdb(rocksdb::Status status) {
  return status.ok() ? Status::OK() : Status::Error(status.ToString());
}
|
|
|
|
// Re-wraps a rocksdb::Slice as a td::Slice over the same pointer and length.
// No bytes are copied here; the result refers to the storage of the input.
static Slice from_rocksdb(rocksdb::Slice slice) {
  const char *begin = slice.data();
  const size_t length = slice.size();
  return Slice(begin, length);
}
|
|
|
|
// Re-wraps a td::Slice as a rocksdb::Slice over the same pointer and length.
// No bytes are copied here; the result refers to the storage of the input.
static rocksdb::Slice to_rocksdb(Slice slice) {
  const char *begin = slice.data();
  const size_t length = slice.size();
  return rocksdb::Slice(begin, length);
}
|
|
|
|
} // namespace
|
|
|
|
|
|
|
|
// Destroys the database stored at `path` by delegating to rocksdb::DestroyDB
// with default-constructed options, and reports the outcome as a td::Status.
Status RocksDb::destroy(Slice path) {
  const std::string db_path = path.str();
  const rocksdb::Status destroy_status = rocksdb::DestroyDB(db_path, rocksdb::Options());
  return from_rocksdb(destroy_status);
}
|
|
|
|
|
|
|
|
// Move constructor: compiler-generated, member-wise move of the wrapper state.
RocksDb::RocksDb(RocksDb &&) = default;
|
|
|
|
// Move assignment: compiler-generated, member-wise move of the wrapper state.
// NOTE(review): end_snapshot() is not called on the assigned-to object here;
// confirm callers never move-assign onto an instance with an active snapshot.
RocksDb &RocksDb::operator=(RocksDb &&) = default;
|
|
|
|
|
|
|
|
// Releases the snapshot held by this instance, if any. Instances without a
// database handle (e.g. moved-from ones) have nothing to release and are
// skipped.
RocksDb::~RocksDb() {
  if (db_) {
    end_snapshot().ensure();
  }
}
|
|
|
|
|
|
|
|
// Creates another wrapper sharing the same underlying database and statistics
// objects. Only db_ and statistics_ are passed on; the snapshot, transaction
// and write batch of this instance are not copied.
RocksDb RocksDb::clone() const {
  auto shared_db = db_;
  auto shared_statistics = statistics_;
  return RocksDb(std::move(shared_db), std::move(shared_statistics));
}
|
|
|
|
|
|
|
|
// Opens the optimistic-transaction database located at `path`, creating it
// when it does not exist yet (create_if_missing).
//
// Returns a RocksDb wrapper that owns the opened database together with a
// freshly created statistics object, or the error reported by
// rocksdb::OptimisticTransactionDB::Open.
Result<RocksDb> RocksDb::open(std::string path) {
  // Filled in by Open() below; initialised so it never holds an indeterminate value.
  rocksdb::OptimisticTransactionDB *db = nullptr;
  auto statistics = rocksdb::CreateDBStatistics();
  {
    rocksdb::Options options;

    // Function-local static: a single LRU block cache (capacity argument 1 << 30)
    // is created on the first call and reused by every database opened afterwards.
    static auto cache = rocksdb::NewLRUCache(1 << 30);

    rocksdb::BlockBasedTableOptions table_options;
    table_options.block_cache = cache;
    options.table_factory.reset(rocksdb::NewBlockBasedTableFactory(table_options));

    options.manual_wal_flush = true;
    options.create_if_missing = true;
    options.max_background_compactions = 4;
    options.max_background_flushes = 2;
    options.bytes_per_sync = 1 << 20;
    options.writable_file_max_buffer_size = 2 << 14;
    options.statistics = statistics;

    rocksdb::OptimisticTransactionDBOptions occ_options;
    occ_options.validate_policy = rocksdb::OccValidationPolicy::kValidateSerial;

    // Only the default column family is opened; it inherits the options above.
    rocksdb::ColumnFamilyOptions cf_options(options);
    std::vector<rocksdb::ColumnFamilyDescriptor> column_families;
    column_families.push_back(rocksdb::ColumnFamilyDescriptor(rocksdb::kDefaultColumnFamilyName, cf_options));
    std::vector<rocksdb::ColumnFamilyHandle *> handles;
    TRY_STATUS(from_rocksdb(
        rocksdb::OptimisticTransactionDB::Open(options, occ_options, std::move(path), column_families, &handles, &db)));
    CHECK(handles.size() == 1);
    // i can delete the handle since DBImpl is always holding a reference to
    // default column family
    delete handles[0];
  }
  return RocksDb(std::shared_ptr<rocksdb::OptimisticTransactionDB>(db), std::move(statistics));
}
|
|
|
|
|
|
|
|
std::unique_ptr<KeyValueReader> RocksDb::snapshot() {
|
|
|
|
auto res = std::make_unique<RocksDb>(clone());
|
|
|
|
res->begin_snapshot().ensure();
|
|
|
|
return std::move(res);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Returns the text RocksDB reports for the "rocksdb.stats" property.
// The result of GetProperty() is not checked, so `out` is returned as-is
// (presumably empty) when the property lookup fails.
std::string RocksDb::stats() const {
  std::string out;
  db_->GetProperty("rocksdb.stats", &out);
  //db_->GetProperty("rocksdb.cur-size-all-mem-tables", &out);
  // The former trailing `return statistics_->ToString();` was unreachable and
  // has been removed.
  return out;
}
|
|
|
|
|
|
|
|
// Looks up `key` and stores the found value in `value`.
//
// Read source, in priority order:
//   1. the active snapshot, if any (read through the database handle);
//   2. the active transaction, if any;
//   3. the database directly.
//
// Returns GetStatus::Ok on success, GetStatus::NotFound when RocksDB reports
// kNotFound, and an error status for every other failure.
Result<RocksDb::GetStatus> RocksDb::get(Slice key, std::string &value) {
  const rocksdb::Slice rocks_key = to_rocksdb(key);

  rocksdb::Status lookup;
  if (snapshot_) {
    rocksdb::ReadOptions read_options;
    read_options.snapshot = snapshot_.get();
    lookup = db_->Get(read_options, rocks_key, &value);
  } else if (transaction_) {
    lookup = transaction_->Get(rocksdb::ReadOptions(), rocks_key, &value);
  } else {
    lookup = db_->Get(rocksdb::ReadOptions(), rocks_key, &value);
  }

  if (lookup.ok()) {
    return GetStatus::Ok;
  }
  if (lookup.code() == rocksdb::Status::kNotFound) {
    return GetStatus::NotFound;
  }
  return from_rocksdb(lookup);
}
|
|
|
|
|
|
|
|
// Stores `value` under `key`. The write goes to the pending write batch when
// one is open, otherwise to the active transaction when one exists, otherwise
// straight to the database with default write options.
Status RocksDb::set(Slice key, Slice value) {
  const rocksdb::Slice rocks_key = to_rocksdb(key);
  const rocksdb::Slice rocks_value = to_rocksdb(value);

  rocksdb::Status put_status;
  if (write_batch_) {
    put_status = write_batch_->Put(rocks_key, rocks_value);
  } else if (transaction_) {
    put_status = transaction_->Put(rocks_key, rocks_value);
  } else {
    put_status = db_->Put(rocksdb::WriteOptions(), rocks_key, rocks_value);
  }
  return from_rocksdb(put_status);
}
|
|
|
|
|
|
|
|
// Removes `key`. The deletion goes to the pending write batch when one is
// open, otherwise to the active transaction when one exists, otherwise
// straight to the database with default write options.
Status RocksDb::erase(Slice key) {
  const rocksdb::Slice rocks_key = to_rocksdb(key);

  rocksdb::Status delete_status;
  if (write_batch_) {
    delete_status = write_batch_->Delete(rocks_key);
  } else if (transaction_) {
    delete_status = transaction_->Delete(rocks_key);
  } else {
    delete_status = db_->Delete(rocksdb::WriteOptions(), rocks_key);
  }
  return from_rocksdb(delete_status);
}
|
|
|
|
|
|
|
|
// Counts the keys that start with `prefix`.
//
// The scan uses the transaction's iterator only when a transaction is active
// and no snapshot is held; in every other case it iterates the database, with
// read options pointing at the current snapshot (which may be null).
//
// Returns the number of matching keys, or the iterator's error status.
Result<size_t> RocksDb::count(Slice prefix) {
  rocksdb::ReadOptions read_options;
  read_options.snapshot = snapshot_.get();

  const bool via_transaction = !snapshot_ && transaction_;
  std::unique_ptr<rocksdb::Iterator> cursor;
  if (via_transaction) {
    cursor.reset(transaction_->GetIterator(read_options));
  } else {
    cursor.reset(db_->NewIterator(read_options));
  }

  size_t matched = 0;
  cursor->Seek(to_rocksdb(prefix));
  while (cursor->Valid()) {
    // Compare only the leading prefix.size() bytes of the current key.
    Slice key_head = from_rocksdb(cursor->key());
    key_head.truncate(prefix.size());
    if (key_head != prefix) {
      // Seek() positioned us at the first candidate; the first key that does
      // not match ends the scan.
      break;
    }
    ++matched;
    cursor->Next();
  }

  if (!cursor->status().ok()) {
    return from_rocksdb(cursor->status());
  }
  return matched;
}
|
|
|
|
|
2020-04-27 12:01:46 +00:00
|
|
|
// Opens a new, empty write batch that subsequent set()/erase() calls append
// to. Must not be called while a transaction is active (CHECKed). Any batch
// that was already pending is replaced.
Status RocksDb::begin_write_batch() {
  CHECK(!transaction_);
  auto fresh_batch = std::make_unique<rocksdb::WriteBatch>();
  write_batch_ = std::move(fresh_batch);
  return Status::OK();
}
|
|
|
|
|
2019-09-07 10:03:22 +00:00
|
|
|
// Starts an optimistic transaction with `sync` enabled in its write options
// and default transaction options. Must not be called while a write batch is
// open (CHECKed). Any previously held transaction object is replaced.
Status RocksDb::begin_transaction() {
  CHECK(!write_batch_);

  rocksdb::WriteOptions write_options;
  write_options.sync = true;

  auto *started = db_->BeginTransaction(write_options, rocksdb::OptimisticTransactionOptions());
  transaction_.reset(started);
  return Status::OK();
}
|
2019-09-07 10:03:22 +00:00
|
|
|
|
2020-04-27 12:01:46 +00:00
|
|
|
// Writes the pending batch to the database with `sync` enabled and returns the
// outcome. A batch must be open (CHECKed). The batch is detached from this
// object before the write, so it is gone afterwards whether or not the write
// succeeded.
Status RocksDb::commit_write_batch() {
  CHECK(write_batch_);

  rocksdb::WriteOptions write_options;
  write_options.sync = true;

  const auto pending_batch = std::move(write_batch_);
  const rocksdb::Status write_status = db_->Write(write_options, pending_batch.get());
  return from_rocksdb(write_status);
}
|
2020-03-23 23:32:16 +00:00
|
|
|
|
2020-04-27 12:01:46 +00:00
|
|
|
// Commits the active transaction and returns the outcome. A transaction must
// be active (CHECKed). The transaction is detached from this object before the
// commit, so it is gone afterwards whether or not the commit succeeded.
Status RocksDb::commit_transaction() {
  CHECK(transaction_);
  const auto finishing = std::move(transaction_);
  const rocksdb::Status commit_status = finishing->Commit();
  return from_rocksdb(commit_status);
}
|
|
|
|
|
|
|
|
// Discards the pending write batch without applying it. A batch must be open
// (CHECKed). Always returns OK.
Status RocksDb::abort_write_batch() {
  CHECK(write_batch_);
  write_batch_ = nullptr;
  return Status::OK();
}
|
|
|
|
|
|
|
|
// Drops the active transaction object without committing it. A transaction
// must be active (CHECKed). Always returns OK.
Status RocksDb::abort_transaction() {
  CHECK(transaction_);
  transaction_ = nullptr;
  return Status::OK();
}
|
|
|
|
|
|
|
|
// Requests a flush from the database using default flush options and returns
// the outcome as a td::Status.
Status RocksDb::flush() {
  const rocksdb::Status flush_status = db_->Flush(rocksdb::FlushOptions());
  return from_rocksdb(flush_status);
}
|
|
|
|
|
|
|
|
// Acquires a snapshot from the database and stores it in snapshot_, which
// get() and count() then read through. Always returns OK.
// NOTE(review): an already-held snapshot is handed to snapshot_'s deleter by
// reset(); confirm callers pair this with end_snapshot().
Status RocksDb::begin_snapshot() {
  auto acquired = db_->GetSnapshot();
  snapshot_.reset(acquired);
  return Status::OK();
}
|
|
|
|
|
|
|
|
// Hands the held snapshot, if any, back to the database via ReleaseSnapshot()
// and leaves snapshot_ empty. A no-op when no snapshot is held. Always
// returns OK.
Status RocksDb::end_snapshot() {
  if (!snapshot_) {
    return Status::OK();
  }
  auto held = snapshot_.release();
  db_->ReleaseSnapshot(held);
  return Status::OK();
}
|
|
|
|
|
|
|
|
RocksDb::RocksDb(std::shared_ptr<rocksdb::OptimisticTransactionDB> db, std::shared_ptr<rocksdb::Statistics> statistics)
|
|
|
|
: db_(std::move(db)), statistics_(std::move(statistics)) {
|
|
|
|
}
|
|
|
|
} // namespace td
|