2011-08-31 13:38:22 +01:00
|
|
|
#ifndef BTREE_CHECKER_H
|
|
|
|
#define BTREE_CHECKER_H
|
2011-08-24 10:45:39 +01:00
|
|
|
|
|
|
|
#include "btree.h"
|
|
|
|
|
2011-09-16 10:06:37 +01:00
|
|
|
#include "checksum.h"
|
2011-08-24 14:27:45 +01:00
|
|
|
#include "error_set.h"
|
2011-09-16 10:06:37 +01:00
|
|
|
#include "hex_dump.h"
|
2011-08-24 14:27:45 +01:00
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
#include <sstream>
|
|
|
|
#include <map>
|
|
|
|
#include <set>
|
|
|
|
|
2011-08-24 14:27:45 +01:00
|
|
|
using namespace persistent_data;
|
|
|
|
using namespace std;
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
//----------------------------------------------------------------
|
|
|
|
|
|
|
|
namespace persistent_data {
|
|
|
|
//----------------------------------------------------------------
|
|
|
|
// Little helper class that keeps track of how many times blocks
|
|
|
|
// are referenced.
|
|
|
|
//----------------------------------------------------------------
|
|
|
|
class block_counter {
|
|
|
|
public:
|
2011-08-25 10:54:43 +01:00
|
|
|
typedef std::map<block_address, unsigned> count_map;
|
2011-08-24 14:27:45 +01:00
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
void inc(block_address b) {
|
2011-08-25 10:54:43 +01:00
|
|
|
count_map::iterator it = counts_.find(b);
|
2011-08-24 10:45:39 +01:00
|
|
|
if (it == counts_.end())
|
|
|
|
counts_.insert(make_pair(b, 1));
|
|
|
|
else
|
|
|
|
it->second++;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned get_count(block_address b) const {
|
2011-08-24 14:27:45 +01:00
|
|
|
count_map::const_iterator it = counts_.find(b);
|
2011-08-24 10:45:39 +01:00
|
|
|
return (it == counts_.end()) ? 0 : it->second;
|
|
|
|
}
|
|
|
|
|
2011-08-24 14:27:45 +01:00
|
|
|
count_map const &get_counts() const {
|
2011-08-24 10:45:39 +01:00
|
|
|
return counts_;
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2011-08-24 14:27:45 +01:00
|
|
|
count_map counts_;
|
2011-08-24 10:45:39 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
//----------------------------------------------------------------
|
|
|
|
// This class implements consistency checking for the btrees in
|
|
|
|
// general. Derive from this if you want some additional checks.
|
|
|
|
// It's worth summarising what is checked:
|
|
|
|
//
|
|
|
|
// Implemented
|
|
|
|
// -----------
|
|
|
|
//
|
|
|
|
// - block_nr
|
|
|
|
// - nr_entries <= max_entries
|
|
|
|
// - max_entries fits in block
|
|
|
|
// - max_entries is divisible by 3
|
|
|
|
// - nr_entries >= minimum (except for root nodes)
|
|
|
|
//
|
|
|
|
// Not implemented
|
|
|
|
// ---------------
|
|
|
|
//
|
|
|
|
// - checksum (note: now implemented, see check_sum())
|
|
|
|
// - leaf | internal flags (this can be inferred from siblings)
|
|
|
|
//----------------------------------------------------------------
|
2011-08-31 12:48:41 +01:00
|
|
|
template <uint32_t Levels, typename ValueTraits>
|
2011-08-31 13:38:22 +01:00
|
|
|
class btree_checker : public btree<Levels, ValueTraits>::visitor {
|
2011-08-24 10:45:39 +01:00
|
|
|
public:
|
2011-08-31 13:38:22 +01:00
|
|
|
btree_checker(block_counter &counter)
|
2011-08-24 14:27:45 +01:00
|
|
|
: counter_(counter),
|
|
|
|
errs_(new error_set("btree errors")) {
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
|
2011-09-02 11:26:42 +01:00
|
|
|
bool visit_internal(unsigned level,
|
2011-10-10 14:10:30 +01:00
|
|
|
bool sub_root,
|
2011-09-02 11:26:42 +01:00
|
|
|
optional<uint64_t> key,
|
2011-08-31 12:48:41 +01:00
|
|
|
btree_detail::node_ref<uint64_traits> const &n) {
|
2011-08-26 11:13:13 +01:00
|
|
|
if (already_visited(n))
|
|
|
|
return false;
|
|
|
|
|
2011-09-16 10:06:37 +01:00
|
|
|
check_sum(n);
|
|
|
|
|
2011-09-02 14:28:42 +01:00
|
|
|
if (!key)
|
|
|
|
new_root(level);
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
check_block_nr(n);
|
|
|
|
check_max_entries(n);
|
2011-09-02 11:26:42 +01:00
|
|
|
check_nr_entries(n, !key);
|
|
|
|
check_ordered_keys(n);
|
|
|
|
check_parent_key(key, n);
|
2011-08-26 11:13:13 +01:00
|
|
|
return true;
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
|
2011-09-02 11:26:42 +01:00
|
|
|
bool visit_internal_leaf(unsigned level,
|
2011-10-10 14:10:30 +01:00
|
|
|
bool sub_root,
|
2011-09-02 11:26:42 +01:00
|
|
|
optional<uint64_t> key,
|
2011-08-31 12:48:41 +01:00
|
|
|
btree_detail::node_ref<uint64_traits> const &n) {
|
2011-08-26 11:13:13 +01:00
|
|
|
if (already_visited(n))
|
|
|
|
return false;
|
|
|
|
|
2011-09-16 10:06:37 +01:00
|
|
|
check_sum(n);
|
|
|
|
|
2011-09-02 14:28:42 +01:00
|
|
|
if (!key)
|
|
|
|
new_root(level);
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
check_block_nr(n);
|
|
|
|
check_max_entries(n);
|
2011-09-02 11:26:42 +01:00
|
|
|
check_nr_entries(n, !key);
|
|
|
|
check_ordered_keys(n);
|
|
|
|
check_parent_key(key, n);
|
|
|
|
check_leaf_key(level, n);
|
2011-09-16 10:06:37 +01:00
|
|
|
|
2011-08-26 11:13:13 +01:00
|
|
|
return true;
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
|
2011-09-02 11:26:42 +01:00
|
|
|
bool visit_leaf(unsigned level,
|
2011-10-10 14:10:30 +01:00
|
|
|
bool sub_root,
|
2011-09-02 11:26:42 +01:00
|
|
|
optional<uint64_t> key,
|
2011-08-31 12:48:41 +01:00
|
|
|
btree_detail::node_ref<ValueTraits> const &n) {
|
2011-08-26 11:13:13 +01:00
|
|
|
if (already_visited(n))
|
|
|
|
return false;
|
|
|
|
|
2011-09-16 10:06:37 +01:00
|
|
|
check_sum(n);
|
|
|
|
|
2011-09-02 14:28:42 +01:00
|
|
|
if (!key)
|
|
|
|
new_root(level);
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
check_block_nr(n);
|
|
|
|
check_max_entries(n);
|
2011-09-02 11:26:42 +01:00
|
|
|
check_nr_entries(n, !key);
|
|
|
|
check_ordered_keys(n);
|
|
|
|
check_parent_key(key, n);
|
|
|
|
check_leaf_key(level, n);
|
2011-08-26 11:13:13 +01:00
|
|
|
return true;
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
|
2011-08-24 14:27:45 +01:00
|
|
|
boost::optional<error_set::ptr> get_errors() const {
|
|
|
|
return errs_;
|
|
|
|
}
|
|
|
|
|
2011-08-26 11:13:13 +01:00
|
|
|
protected:
|
|
|
|
block_counter &get_counter() {
|
|
|
|
return counter_;
|
|
|
|
}
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
private:
|
2011-08-26 11:13:13 +01:00
|
|
|
template <typename node>
|
|
|
|
bool already_visited(node const &n) {
|
|
|
|
block_address b = n.get_location();
|
|
|
|
|
|
|
|
counter_.inc(b);
|
|
|
|
|
|
|
|
if (seen_.count(b) > 0)
|
|
|
|
return true;
|
2011-08-24 10:45:39 +01:00
|
|
|
|
|
|
|
seen_.insert(b);
|
2011-08-26 11:13:13 +01:00
|
|
|
return false;
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
|
2011-09-16 10:06:37 +01:00
|
|
|
template <typename node>
|
|
|
|
void check_sum(node const &n) const {
|
|
|
|
crc32c sum(BTREE_CSUM_XOR);
|
|
|
|
|
|
|
|
disk_node const *data = n.raw();
|
|
|
|
sum.append(&data->header.flags, MD_BLOCK_SIZE - sizeof(uint32_t));
|
|
|
|
if (sum.get_sum() != n.get_checksum()) {
|
|
|
|
std::ostringstream out;
|
|
|
|
out << "checksum error for block " << n.get_block_nr()
|
|
|
|
<< ", sum was " << sum.get_sum()
|
|
|
|
<< ", expected " << n.get_checksum();
|
|
|
|
errs_->add_child(out.str());
|
|
|
|
throw runtime_error(out.str());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
template <typename node>
|
|
|
|
void check_block_nr(node const &n) const {
|
|
|
|
if (n.get_location() != n.get_block_nr()) {
|
|
|
|
std::ostringstream out;
|
|
|
|
out << "block number mismatch: actually "
|
|
|
|
<< n.get_location()
|
|
|
|
<< ", claims " << n.get_block_nr();
|
2011-08-24 14:27:45 +01:00
|
|
|
errs_->add_child(out.str());
|
|
|
|
throw runtime_error(out.str());
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename node>
|
|
|
|
void check_max_entries(node const &n) const {
|
|
|
|
size_t elt_size = sizeof(uint64_t) + n.get_value_size();
|
2011-08-31 12:48:41 +01:00
|
|
|
if (elt_size * n.get_max_entries() + sizeof(node_header) > MD_BLOCK_SIZE) {
|
2011-08-24 10:45:39 +01:00
|
|
|
std::ostringstream out;
|
|
|
|
out << "max entries too large: " << n.get_max_entries();
|
2011-08-24 14:27:45 +01:00
|
|
|
errs_->add_child(out.str());
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
if (n.get_max_entries() % 3) {
|
|
|
|
std::ostringstream out;
|
|
|
|
out << "max entries is not divisible by 3: " << n.get_max_entries();
|
2011-08-24 14:27:45 +01:00
|
|
|
errs_->add_child(out.str());
|
|
|
|
throw runtime_error(out.str());
|
2011-08-24 10:45:39 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename node>
|
|
|
|
void check_nr_entries(node const &n, bool is_root) const {
|
|
|
|
if (n.get_nr_entries() > n.get_max_entries()) {
|
|
|
|
std::ostringstream out;
|
|
|
|
out << "bad nr_entries: "
|
|
|
|
<< n.get_nr_entries() << " < "
|
|
|
|
<< n.get_max_entries();
|
2011-08-24 14:27:45 +01:00
|
|
|
errs_->add_child(out.str());
|
2011-08-24 10:45:39 +01:00
|
|
|
throw std::runtime_error(out.str());
|
|
|
|
}
|
|
|
|
|
|
|
|
block_address min = n.get_max_entries() / 3;
|
|
|
|
if (!is_root && (n.get_nr_entries() < min)) {
|
|
|
|
ostringstream out;
|
|
|
|
out << "too few entries in btree: "
|
|
|
|
<< n.get_nr_entries()
|
|
|
|
<< ", expected at least "
|
|
|
|
<< min;
|
2011-08-24 14:27:45 +01:00
|
|
|
errs_->add_child(out.str());
|
2011-08-24 10:45:39 +01:00
|
|
|
throw runtime_error(out.str());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-09-02 11:26:42 +01:00
|
|
|
template <typename node>
|
|
|
|
void check_ordered_keys(node const &n) const {
|
|
|
|
unsigned nr_entries = n.get_nr_entries();
|
|
|
|
|
|
|
|
if (nr_entries == 0)
|
|
|
|
return; // can only happen if a root node
|
|
|
|
|
|
|
|
uint64_t last_key = n.key_at(0);
|
|
|
|
|
|
|
|
for (unsigned i = 1; i < nr_entries; i++) {
|
|
|
|
uint64_t k = n.key_at(i);
|
|
|
|
if (k <= last_key) {
|
|
|
|
ostringstream out;
|
|
|
|
out << "keys are out of order, " << k << " <= " << last_key;
|
|
|
|
throw runtime_error(out.str());
|
|
|
|
}
|
|
|
|
last_key = k;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename node>
|
|
|
|
void check_parent_key(boost::optional<uint64_t> key, node const &n) const {
|
|
|
|
if (!key)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (*key > n.key_at(0)) {
|
|
|
|
ostringstream out;
|
|
|
|
out << "parent key mismatch: parent was " << *key
|
|
|
|
<< ", but lowest in node was " << n.key_at(0);
|
|
|
|
throw runtime_error(out.str());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename node>
|
|
|
|
void check_leaf_key(unsigned level, node const &n) {
|
|
|
|
if (n.get_nr_entries() == 0)
|
|
|
|
return; // can only happen if a root node
|
|
|
|
|
|
|
|
if (last_leaf_key_[level] && *last_leaf_key_[level] >= n.key_at(0)) {
|
|
|
|
ostringstream out;
|
|
|
|
out << "the last key of the previous leaf was " << *last_leaf_key_[level]
|
|
|
|
<< " and the first key of this leaf is " << n.key_at(0);
|
|
|
|
throw runtime_error(out.str());
|
|
|
|
}
|
|
|
|
|
|
|
|
last_leaf_key_[level] = n.key_at(n.get_nr_entries() - 1);
|
|
|
|
}
|
|
|
|
|
2011-09-02 14:28:42 +01:00
|
|
|
void new_root(unsigned level) {
|
|
|
|
// we're starting a new subtree, so should
|
|
|
|
// reset the last_leaf value.
|
|
|
|
last_leaf_key_[level] = boost::optional<uint64_t>();
|
|
|
|
}
|
|
|
|
|
2011-08-24 10:45:39 +01:00
|
|
|
block_counter &counter_;
|
|
|
|
std::set<block_address> seen_;
|
2011-08-24 14:27:45 +01:00
|
|
|
error_set::ptr errs_;
|
2011-09-02 11:26:42 +01:00
|
|
|
boost::optional<uint64_t> last_leaf_key_[Levels];
|
2011-08-24 10:45:39 +01:00
|
|
|
};
|
|
|
|
}
|
|
|
|
|
|
|
|
//----------------------------------------------------------------
|
|
|
|
|
|
|
|
#endif
|