#ifndef SPACE_MAP_DISK_H #define SPACE_MAP_DISK_H #include "space_map.h" #include "transaction_manager.h" #include "endian.h" #include "space_map_disk_structures.h" #include "math.h" //---------------------------------------------------------------- namespace persistent_data { namespace sm_disk_detail { using namespace base; using namespace persistent_data; template class bitmap { public: bitmap(typename transaction_manager::ptr tm, index_entry const &ie) : tm_(tm), ie_(ie) { } ref_t lookup(unsigned b) const { auto rr = tm_->read_lock(ie_.blocknr_); void const *bits = bitmap_data(rr); ref_t b1 = test_bit_le(bits, b * 2); ref_t b2 = test_bit_le(bits, b * 2 + 1); ref_t result = b2 ? 1 : 0; result |= b1 ? 0b10 : 0; return result; } void insert(unsigned b, ref_t n) { auto wr = tm_->shadow(ie_.blocknr_).first; void *bits = bitmap_data(wr); bool was_free = !test_bit_le(bits, b * 2) && !test_bit_le(bits, b * 2 + 1); if (n == 1 || n == 3) set_bit_le(bits, b * 2 + 1); else clear_bit_le(bits, b * 2 + 1); if (n == 2 || n == 3) set_bit_le(bits, b * 2); else clear_bit_le(bits, b * 2); ie_.blocknr_ = wr.get_location(); if (was_free && n > 0) { ie_.nr_free_--; if (b == ie_.none_free_before_) ie_.none_free_before_++; } if (!was_free && n == 0) { ie_.nr_free_++; if (b < ie_.none_free_before_) ie_.none_free_before_ = b; } } unsigned find_free(unsigned end) { for (unsigned i = ie_.none_free_before_; i < end; i++) { if (lookup(i) == 0) { insert(i, 1); ie_.none_free_before_ = i + 1; return i; } } throw std::runtime_error("no free entry in bitmap"); } index_entry const &get_ie() const { return ie_; } private: void *bitmap_data(typename transaction_manager::write_ref &wr) { bitmap_header *h = reinterpret_cast(&wr.data()[0]); return h + 1; } void const *bitmap_data(typename transaction_manager::read_ref &rr) const { bitmap_header const *h = reinterpret_cast(&rr.data()[0]); return h + 1; } typename transaction_manager::ptr tm_; index_entry ie_; }; struct ref_count_traits { typedef __le32 disk_type; typedef uint32_t value_type; typedef NoOpRefCounter ref_counter; static void unpack(disk_type const &d, value_type &v) { v = to_cpu(d); } static void pack(value_type const &v, disk_type &d) { d = to_disk(v); } }; template class sm_disk_base : public persistent_space_map { public: typedef boost::shared_ptr > ptr; sm_disk_base(typename transaction_manager::ptr tm) : tm_(tm), entries_per_block_((BlockSize - sizeof(bitmap_header)) * 4), nr_blocks_(0), nr_allocated_(0), ref_counts_(tm_, ref_count_traits::ref_counter()) { } sm_disk_base(typename transaction_manager::ptr tm, sm_root const &root) : tm_(tm), nr_blocks_(root.nr_blocks_), nr_allocated_(root.nr_allocated_), ref_counts_(tm_, root.ref_count_root_, ref_count_traits::ref_counter()) { } block_address get_nr_blocks() const { return nr_blocks_; } block_address get_nr_free() const { return nr_blocks_ - nr_allocated_; } ref_t get_count(block_address b) const { auto count = lookup_bitmap(b); if (count == 3) return lookup_ref_count(b); return count; } void set_count(block_address b, ref_t c) { ref_t old = get_count(b); if (c == old) return; if (c > 2) { if (old < 3) insert_bitmap(b, 3); insert_ref_count(b, c); } else { if (old > 2) remove_ref_count(b); insert_bitmap(b, c); } if (old == 0) nr_allocated_++; else if (c == 0) nr_allocated_--; } void commit() { } void inc(block_address b) { // FIXME: 2 get_counts ref_t old = get_count(b); set_count(b, old + 1); } void dec(block_address b) { ref_t old = get_count(b); set_count(b, old - 1); } block_address new_block() { // silly to always start searching from the // beginning. block_address nr_indexes = div_up(nr_blocks_, entries_per_block_); for (block_address index = 0; index < nr_indexes; index++) { auto ie = find_ie(index); bitmap bm(tm_, ie); block_address b = bm.find_free((index == nr_indexes - 1) ? nr_blocks_ % entries_per_block_ : entries_per_block_); save_ie(b, bm.get_ie()); nr_allocated_++; b = (index * entries_per_block_) + b; assert(get_count(b) == 1); return b; } throw runtime_error("out of space"); } bool count_possibly_greater_than_one(block_address b) const { return get_count(b) > 1; } virtual void extend(block_address extra_blocks) { block_address nr_blocks = nr_blocks_ + extra_blocks; block_address bitmap_count = div_up(nr_blocks, entries_per_block_); block_address old_bitmap_count = div_up(nr_blocks_, entries_per_block_); for (block_address i = old_bitmap_count; i < bitmap_count; i++) { auto wr = tm_->new_block(); struct index_entry ie; ie.blocknr_ = wr.get_location(); ie.nr_free_ = i == (bitmap_count - 1) ? (nr_blocks % entries_per_block_) : entries_per_block_; ie.none_free_before_ = 0; save_ie(i, ie); } nr_blocks_ = nr_blocks; } protected: typename transaction_manager::ptr get_tm() const { return tm_; } block_address get_nr_allocated() const { return nr_allocated_; } block_address get_ref_count_root() const { return ref_counts_.get_root(); } unsigned get_entries_per_block() const { return entries_per_block_; } private: virtual index_entry find_ie(block_address b) const = 0; virtual void save_ie(block_address b, struct index_entry ie) = 0; ref_t lookup_bitmap(block_address b) const { index_entry ie = find_ie(b); bitmap bm(tm_, ie); return bm.lookup(b % entries_per_block_); } void insert_bitmap(block_address b, unsigned n) { if (n > 3) throw runtime_error("bitmap can only hold 2 bit values"); auto ie = find_ie(b); bitmap bm(tm_, ie); bm.insert(b % entries_per_block_, n); save_ie(b, bm.get_ie()); } ref_t lookup_ref_count(block_address b) const { uint64_t key[1] = {b}; auto mvalue = ref_counts_.lookup(key); if (!mvalue) throw runtime_error("ref count not in tree"); return *mvalue; } void insert_ref_count(block_address b, ref_t count) { uint64_t key[1] = {b}; ref_counts_.insert(key, count); } void remove_ref_count(block_address b) { uint64_t key[1] = {b}; ref_counts_.remove(key); } typename transaction_manager::ptr tm_; uint32_t entries_per_block_; block_address nr_blocks_; block_address nr_allocated_; btree<1, ref_count_traits, BlockSize> ref_counts_; }; template class sm_disk : public sm_disk_base { public: typedef boost::shared_ptr > ptr; sm_disk(typename transaction_manager::ptr tm) : sm_disk_base(tm), bitmaps_(sm_disk_base::get_tm(), typename sm_disk_detail::index_entry_traits::ref_counter()) { } sm_disk(typename transaction_manager::ptr tm, sm_root const &root) : sm_disk_base(tm, root), bitmaps_(sm_disk_base::get_tm(), root.bitmap_root_, typename sm_disk_detail::index_entry_traits::ref_counter()) { } size_t root_size() { return sizeof(sm_root_disk); } void copy_root(void *dest, size_t len) { sm_root_disk d; sm_root v; if (len < sizeof(d)) throw runtime_error("root too small"); v.nr_blocks_ = sm_disk_base::get_nr_blocks(); v.nr_allocated_ = sm_disk_base::get_nr_allocated(); v.bitmap_root_ = bitmaps_.get_root(); v.ref_count_root_ = sm_disk_base::get_ref_count_root(); sm_root_traits::pack(v, d); ::memcpy(dest, &d, sizeof(d)); } private: index_entry find_ie(block_address b) const { uint64_t key[1] = {b / sm_disk_base::get_entries_per_block()}; auto mindex = bitmaps_.lookup(key); if (!mindex) throw runtime_error("Couldn't lookup bitmap"); return *mindex; } void save_ie(block_address b, struct index_entry ie) { uint64_t key[1] = {b / sm_disk_base::get_entries_per_block()}; bitmaps_.insert(key, ie); } btree<1, index_entry_traits, BlockSize> bitmaps_; }; } template persistent_space_map::ptr create_disk_sm(typename transaction_manager::ptr tm, block_address nr_blocks) { using namespace sm_disk_detail; typename persistent_space_map::ptr sm( new sm_disk(tm)); sm->extend(nr_blocks); return sm; } template persistent_space_map::ptr open_disk_sm(typename transaction_manager::ptr tm, void *root) { using namespace sm_disk_detail; sm_root_disk d; sm_root v; ::memcpy(&d, root, sizeof(d)); sm_root_traits::unpack(d, v); return typename persistent_space_map::ptr( new sm_disk(tm, v)); } } //---------------------------------------------------------------- #endif