2020-07-28 15:21:48 +05:30
|
|
|
use anyhow::{anyhow, Result};
|
2020-07-29 15:42:03 +05:30
|
|
|
use fixedbitset::FixedBitSet;
|
2020-07-30 14:42:51 +05:30
|
|
|
use nom::{number::complete::*, IResult};
|
2020-07-27 20:23:42 +05:30
|
|
|
use std::path::Path;
|
|
|
|
use std::sync::{Arc, Mutex};
|
2020-07-30 14:42:51 +05:30
|
|
|
use std::time::Instant;
|
2020-07-29 21:08:52 +05:30
|
|
|
use threadpool::ThreadPool;
|
2020-06-09 13:45:00 +05:30
|
|
|
|
2020-07-30 14:42:51 +05:30
|
|
|
use crate::block_manager::{AsyncIoEngine, Block, IoEngine};
|
2020-07-28 15:21:48 +05:30
|
|
|
use crate::checksum;
|
|
|
|
use crate::thin::superblock::*;
|
2020-06-09 13:45:00 +05:30
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
//------------------------------------------
|
|
|
|
|
2020-07-28 15:21:48 +05:30
|
|
|
trait ValueType {
|
|
|
|
type Value;
|
|
|
|
fn unpack(data: &[u8]) -> IResult<&[u8], Self::Value>;
|
|
|
|
}
|
|
|
|
|
2020-07-30 14:42:51 +05:30
|
|
|
/// Decoded form of the fixed-size header found at the start of a btree node.
///
/// Populated by `unpack_node_header`; the checksum and trailing padding words
/// of the on-disk header are parsed but not retained.
// Not every field is read yet, hence the lint suppression.
#[allow(dead_code)]
struct NodeHeader {
    /// True when the header's flags word equals `LEAF_NODE`.
    is_leaf: bool,
    /// Block number recorded in the header.
    /// NOTE(review): presumably the node's own location -- confirm.
    block: u64,
    /// Number of entries currently held by the node.
    nr_entries: u32,
    /// Number of key slots in the node.
    max_entries: u32,
    /// Value size field from the header.
    /// NOTE(review): presumably in bytes -- confirm.
    value_size: u32,
}
|
|
|
|
|
2020-07-30 14:42:51 +05:30
|
|
|
/// Flags value for an internal node.
// Currently unreferenced: anything that is not `LEAF_NODE` is treated as
// internal by `unpack_node_header`, hence the lint suppression.
#[allow(dead_code)]
const INTERNAL_NODE: u32 = 1;

/// Flags value that `unpack_node_header` compares against to detect a leaf.
const LEAF_NODE: u32 = 2;
|
|
|
|
|
|
|
|
fn unpack_node_header(data: &[u8]) -> IResult<&[u8], NodeHeader> {
|
|
|
|
let (i, _csum) = le_u32(data)?;
|
|
|
|
let (i, flags) = le_u32(i)?;
|
|
|
|
let (i, block) = le_u64(i)?;
|
|
|
|
let (i, nr_entries) = le_u32(i)?;
|
|
|
|
let (i, max_entries) = le_u32(i)?;
|
|
|
|
let (i, value_size) = le_u32(i)?;
|
|
|
|
let (i, _padding) = le_u32(i)?;
|
|
|
|
|
|
|
|
Ok((
|
|
|
|
i,
|
|
|
|
NodeHeader {
|
|
|
|
is_leaf: flags == LEAF_NODE,
|
|
|
|
block,
|
|
|
|
nr_entries,
|
|
|
|
max_entries,
|
|
|
|
value_size,
|
|
|
|
},
|
|
|
|
))
|
|
|
|
}
|
|
|
|
|
|
|
|
enum Node<V: ValueType> {
|
|
|
|
Internal {
|
|
|
|
header: NodeHeader,
|
|
|
|
keys: Vec<u64>,
|
|
|
|
values: Vec<u64>,
|
|
|
|
},
|
|
|
|
Leaf {
|
|
|
|
header: NodeHeader,
|
|
|
|
keys: Vec<u64>,
|
|
|
|
values: Vec<V::Value>,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
fn unpack_node_<V: ValueType>(data: &[u8]) -> IResult<&[u8], Node<V>> {
|
|
|
|
use nom::multi::count;
|
|
|
|
|
|
|
|
let (i, header) = unpack_node_header(data)?;
|
|
|
|
let (i, keys) = count(le_u64, header.nr_entries as usize)(i)?;
|
|
|
|
|
|
|
|
let nr_free = header.max_entries - header.nr_entries;
|
|
|
|
let (i, _padding) = count(le_u64, nr_free as usize)(i)?;
|
|
|
|
|
|
|
|
if header.is_leaf {
|
|
|
|
let (i, values) = count(V::unpack, header.nr_entries as usize)(i)?;
|
|
|
|
Ok((
|
|
|
|
i,
|
|
|
|
Node::Leaf {
|
|
|
|
header,
|
|
|
|
keys,
|
|
|
|
values,
|
|
|
|
},
|
|
|
|
))
|
|
|
|
} else {
|
|
|
|
let (i, values) = count(le_u64, header.nr_entries as usize)(i)?;
|
|
|
|
Ok((
|
|
|
|
i,
|
|
|
|
Node::Internal {
|
|
|
|
header,
|
|
|
|
keys,
|
|
|
|
values,
|
|
|
|
},
|
|
|
|
))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn unpack_node<V: ValueType>(data: &[u8]) -> Result<Node<V>> {
|
|
|
|
if let Ok((_i, node)) = unpack_node_(data) {
|
|
|
|
Ok(node)
|
|
|
|
} else {
|
|
|
|
Err(anyhow!("couldn't unpack btree node"))
|
|
|
|
}
|
|
|
|
}
|
2020-06-09 13:45:00 +05:30
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
//------------------------------------------
|
|
|
|
|
2020-07-28 15:21:48 +05:30
|
|
|
struct ValueU64;
|
|
|
|
|
|
|
|
impl ValueType for ValueU64 {
|
|
|
|
type Value = u64;
|
|
|
|
fn unpack(i: &[u8]) -> IResult<&[u8], u64> {
|
|
|
|
le_u64(i)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
//------------------------------------------
|
|
|
|
|
|
|
|
trait NodeVisitor<V: ValueType> {
|
2020-07-29 21:08:52 +05:30
|
|
|
fn visit<'a>(&mut self, w: &BTreeWalker, b: &Block, node: &Node<V>) -> Result<()>;
|
2020-07-29 15:42:03 +05:30
|
|
|
}
|
|
|
|
|
2020-07-29 21:08:52 +05:30
|
|
|
#[derive(Clone)]
|
|
|
|
struct BTreeWalker {
|
2020-07-30 14:29:02 +05:30
|
|
|
engine: Arc<AsyncIoEngine>,
|
2020-07-29 21:08:52 +05:30
|
|
|
seen: Arc<Mutex<FixedBitSet>>,
|
2020-07-29 15:42:03 +05:30
|
|
|
}
|
|
|
|
|
2020-07-29 21:08:52 +05:30
|
|
|
impl BTreeWalker {
|
|
|
|
fn new(engine: AsyncIoEngine) -> BTreeWalker {
|
2020-07-29 15:42:03 +05:30
|
|
|
let nr_blocks = engine.get_nr_blocks() as usize;
|
2020-07-29 21:08:52 +05:30
|
|
|
let r: BTreeWalker = BTreeWalker {
|
2020-07-30 14:29:02 +05:30
|
|
|
engine: Arc::new(engine),
|
2020-07-29 21:08:52 +05:30
|
|
|
seen: Arc::new(Mutex::new(FixedBitSet::with_capacity(nr_blocks))),
|
|
|
|
};
|
2020-07-29 15:42:03 +05:30
|
|
|
r
|
|
|
|
}
|
|
|
|
|
|
|
|
fn walk_nodes<NV, V>(&mut self, visitor: &mut NV, bs: &Vec<u64>) -> Result<()>
|
|
|
|
where
|
|
|
|
NV: NodeVisitor<V>,
|
|
|
|
V: ValueType,
|
|
|
|
{
|
|
|
|
let mut blocks = Vec::new();
|
2020-07-29 21:08:52 +05:30
|
|
|
let seen = self.seen.lock().unwrap();
|
2020-07-29 15:42:03 +05:30
|
|
|
for b in bs {
|
2020-07-29 21:08:52 +05:30
|
|
|
if !seen[*b as usize] {
|
2020-07-29 15:42:03 +05:30
|
|
|
blocks.push(Block::new(*b));
|
|
|
|
}
|
|
|
|
}
|
2020-07-29 21:08:52 +05:30
|
|
|
drop(seen);
|
2020-07-29 15:42:03 +05:30
|
|
|
|
2020-07-30 14:29:02 +05:30
|
|
|
self.engine.read_many(&mut blocks)?;
|
2020-07-29 15:42:03 +05:30
|
|
|
|
|
|
|
for b in blocks {
|
|
|
|
self.walk_node(visitor, &b)?;
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
fn walk_node<NV, V>(&mut self, visitor: &mut NV, b: &Block) -> Result<()>
|
|
|
|
where
|
|
|
|
NV: NodeVisitor<V>,
|
|
|
|
V: ValueType,
|
|
|
|
{
|
2020-07-29 21:08:52 +05:30
|
|
|
let mut seen = self.seen.lock().unwrap();
|
|
|
|
seen.insert(b.loc as usize);
|
|
|
|
drop(seen);
|
2020-07-29 15:42:03 +05:30
|
|
|
|
|
|
|
let bt = checksum::metadata_block_type(b.get_data());
|
|
|
|
if bt != checksum::BT::NODE {
|
|
|
|
return Err(anyhow!("checksum failed for node {}, {:?}", b.loc, bt));
|
|
|
|
}
|
|
|
|
|
|
|
|
let node = unpack_node::<V>(&b.get_data())?;
|
|
|
|
visitor.visit(self, &b, &node)?;
|
|
|
|
|
|
|
|
if let Node::Internal {
|
|
|
|
header: _h,
|
|
|
|
keys: _k,
|
|
|
|
values,
|
|
|
|
} = node
|
|
|
|
{
|
|
|
|
self.walk_nodes(visitor, &values)?;
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
//------------------------------------------
|
|
|
|
|
2020-07-30 14:42:51 +05:30
|
|
|
/// A leaf value split into its two packed components.
///
/// Produced by `ValueBlockTime::unpack` from a single 64-bit word.
// The fields are decoded but not read anywhere yet, hence the lint
// suppression.
#[allow(dead_code)]
struct BlockTime {
    /// The upper 40 bits of the packed word.
    block: u64,
    /// The lower 24 bits of the packed word.
    time: u32,
}
|
|
|
|
|
|
|
|
struct ValueBlockTime;
|
|
|
|
|
|
|
|
impl ValueType for ValueBlockTime {
|
|
|
|
type Value = BlockTime;
|
|
|
|
fn unpack(i: &[u8]) -> IResult<&[u8], BlockTime> {
|
|
|
|
let (i, n) = le_u64(i)?;
|
|
|
|
let block = n >> 24;
|
|
|
|
let time = n & ((1 << 24) - 1);
|
|
|
|
|
|
|
|
Ok((
|
|
|
|
i,
|
|
|
|
BlockTime {
|
|
|
|
block,
|
|
|
|
time: time as u32,
|
|
|
|
},
|
|
|
|
))
|
2020-06-09 13:45:00 +05:30
|
|
|
}
|
2020-07-28 15:21:48 +05:30
|
|
|
}
|
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
struct TopLevelVisitor {}
|
|
|
|
|
|
|
|
impl NodeVisitor<ValueU64> for TopLevelVisitor {
|
2020-07-29 21:08:52 +05:30
|
|
|
fn visit(&mut self, w: &BTreeWalker, _b: &Block, node: &Node<ValueU64>) -> Result<()> {
|
2020-07-29 15:42:03 +05:30
|
|
|
if let Node::Leaf {
|
|
|
|
header: _h,
|
|
|
|
keys,
|
|
|
|
values,
|
|
|
|
} = node
|
|
|
|
{
|
2020-07-29 21:08:52 +05:30
|
|
|
let mut blocks = Vec::new();
|
|
|
|
let mut thin_ids = Vec::new();
|
|
|
|
let seen = w.seen.lock().unwrap();
|
|
|
|
for n in 0..keys.len() {
|
|
|
|
let b = values[n];
|
|
|
|
if !seen[b as usize] {
|
|
|
|
thin_ids.push(keys[n]);
|
|
|
|
blocks.push(Block::new(b));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
drop(seen);
|
|
|
|
|
2020-07-30 14:29:02 +05:30
|
|
|
w.engine.read_many(&mut blocks)?;
|
2020-07-29 21:08:52 +05:30
|
|
|
|
|
|
|
// FIXME: with a thread pool we need to return errors another way.
|
|
|
|
let nr_workers = 16;
|
|
|
|
let pool = ThreadPool::new(nr_workers);
|
|
|
|
|
|
|
|
let mut n = 0;
|
|
|
|
for b in blocks {
|
|
|
|
let thin_id = thin_ids[n];
|
|
|
|
n += 1;
|
|
|
|
|
|
|
|
let mut w = w.clone();
|
|
|
|
pool.execute(move || {
|
|
|
|
let mut v = BottomLevelVisitor {};
|
2020-07-30 14:42:51 +05:30
|
|
|
w.walk_node(&mut v, &b).expect("walk failed"); // FIXME: return error
|
2020-07-29 21:08:52 +05:30
|
|
|
eprintln!("checked thin_dev {}", thin_id);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
pool.join();
|
2020-07-28 16:15:25 +05:30
|
|
|
}
|
2020-07-29 21:08:52 +05:30
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
Ok(())
|
2020-07-28 16:15:25 +05:30
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
struct BottomLevelVisitor {}
|
2020-07-28 15:21:48 +05:30
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
impl NodeVisitor<ValueBlockTime> for BottomLevelVisitor {
|
2020-07-29 21:08:52 +05:30
|
|
|
fn visit(&mut self, _w: &BTreeWalker, _b: &Block, _node: &Node<ValueBlockTime>) -> Result<()> {
|
2020-07-29 15:42:03 +05:30
|
|
|
Ok(())
|
2020-07-28 15:21:48 +05:30
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-29 15:42:03 +05:30
|
|
|
//------------------------------------------
|
|
|
|
|
2020-07-28 15:21:48 +05:30
|
|
|
pub fn check(dev: &Path) -> Result<()> {
|
2020-07-28 17:27:30 +05:30
|
|
|
//let mut engine = SyncIoEngine::new(dev)?;
|
|
|
|
let mut engine = AsyncIoEngine::new(dev, 256)?;
|
2020-06-09 13:45:00 +05:30
|
|
|
|
2020-07-27 20:23:42 +05:30
|
|
|
let now = Instant::now();
|
2020-07-28 15:21:48 +05:30
|
|
|
let sb = read_superblock(&mut engine, SUPERBLOCK_LOCATION)?;
|
|
|
|
eprintln!("{:?}", sb);
|
2020-07-28 16:15:25 +05:30
|
|
|
|
|
|
|
let mut root = Block::new(sb.mapping_root);
|
|
|
|
engine.read(&mut root)?;
|
|
|
|
|
2020-07-29 21:08:52 +05:30
|
|
|
let mut w = BTreeWalker::new(engine);
|
2020-07-29 15:42:03 +05:30
|
|
|
let mut visitor = TopLevelVisitor {};
|
2020-07-30 14:42:51 +05:30
|
|
|
let _result = w.walk_node(&mut visitor, &root)?;
|
2020-07-29 15:42:03 +05:30
|
|
|
println!("read mapping tree in {} ms", now.elapsed().as_millis());
|
2020-07-27 20:23:42 +05:30
|
|
|
|
2020-06-09 13:45:00 +05:30
|
|
|
Ok(())
|
|
|
|
}
|
2020-07-29 21:08:52 +05:30
|
|
|
|
|
|
|
//------------------------------------------
|