[thin_check (rust)] First attempt at multithreading the tree walking.
Still using a single I/O engine, so there is little benefit yet.
This commit is contained in:
parent
d5597d5d36
commit
4f120911d2
10
Cargo.lock
generated
10
Cargo.lock
generated
@ -619,6 +619,7 @@ dependencies = [
|
|||||||
"rand",
|
"rand",
|
||||||
"tempfile",
|
"tempfile",
|
||||||
"thiserror",
|
"thiserror",
|
||||||
|
"threadpool",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
@ -650,6 +651,15 @@ dependencies = [
|
|||||||
"lazy_static",
|
"lazy_static",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "threadpool"
|
||||||
|
version = "1.8.1"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "d050e60b33d41c19108b32cea32164033a9013fe3b46cbd4457559bfbf77afaa"
|
||||||
|
dependencies = [
|
||||||
|
"num_cpus",
|
||||||
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "unicode-width"
|
name = "unicode-width"
|
||||||
version = "0.1.8"
|
version = "0.1.8"
|
||||||
|
@ -23,6 +23,7 @@ num-traits = "0.2"
|
|||||||
quick-xml = "0.18"
|
quick-xml = "0.18"
|
||||||
rand = "0.7"
|
rand = "0.7"
|
||||||
tempfile = "3.1"
|
tempfile = "3.1"
|
||||||
|
threadpool = "1.8"
|
||||||
thiserror = "1.0"
|
thiserror = "1.0"
|
||||||
|
|
||||||
[dev-dependencies]
|
[dev-dependencies]
|
||||||
|
@ -6,7 +6,7 @@ use std::fs::OpenOptions;
|
|||||||
use std::io;
|
use std::io;
|
||||||
use std::io::{Read, Seek};
|
use std::io::{Read, Seek};
|
||||||
use std::os::unix::fs::OpenOptionsExt;
|
use std::os::unix::fs::OpenOptionsExt;
|
||||||
use std::os::unix::io::AsRawFd;
|
use std::os::unix::io::{RawFd, AsRawFd};
|
||||||
use std::path::Path;
|
use std::path::Path;
|
||||||
use std::sync::{Arc, Mutex};
|
use std::sync::{Arc, Mutex};
|
||||||
use io_uring::opcode::{self, types};
|
use io_uring::opcode::{self, types};
|
||||||
@ -45,6 +45,8 @@ impl Drop for Block {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
unsafe impl Send for Block {}
|
||||||
|
|
||||||
//------------------------------------------
|
//------------------------------------------
|
||||||
|
|
||||||
pub trait IoEngine {
|
pub trait IoEngine {
|
||||||
@ -105,9 +107,11 @@ impl IoEngine for SyncIoEngine {
|
|||||||
//------------------------------------------
|
//------------------------------------------
|
||||||
|
|
||||||
pub struct AsyncIoEngine {
|
pub struct AsyncIoEngine {
|
||||||
|
queue_len: u32,
|
||||||
ring: IoUring,
|
ring: IoUring,
|
||||||
nr_blocks: u64,
|
nr_blocks: u64,
|
||||||
input: File,
|
fd: RawFd,
|
||||||
|
input: Arc<File>,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl AsyncIoEngine {
|
impl AsyncIoEngine {
|
||||||
@ -118,14 +122,29 @@ impl AsyncIoEngine {
|
|||||||
.custom_flags(libc::O_DIRECT)
|
.custom_flags(libc::O_DIRECT)
|
||||||
.open(path)?;
|
.open(path)?;
|
||||||
|
|
||||||
Ok(AsyncIoEngine {
|
Ok (AsyncIoEngine {
|
||||||
|
queue_len,
|
||||||
ring: IoUring::new(queue_len)?,
|
ring: IoUring::new(queue_len)?,
|
||||||
nr_blocks: get_nr_blocks(path)?,
|
nr_blocks: get_nr_blocks(path)?,
|
||||||
input,
|
fd: input.as_raw_fd(),
|
||||||
|
input: Arc::new(input),
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
impl Clone for AsyncIoEngine {
|
||||||
|
fn clone(&self) -> AsyncIoEngine {
|
||||||
|
eprintln!("in clone, queue_len = {}", self.queue_len);
|
||||||
|
AsyncIoEngine {
|
||||||
|
queue_len: self.queue_len,
|
||||||
|
ring: IoUring::new(self.queue_len).expect("couldn't create uring"),
|
||||||
|
nr_blocks: self.nr_blocks,
|
||||||
|
fd: self.fd,
|
||||||
|
input: self.input.clone(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
impl IoEngine for AsyncIoEngine {
|
impl IoEngine for AsyncIoEngine {
|
||||||
fn get_nr_blocks(&self) -> u64 {
|
fn get_nr_blocks(&self) -> u64 {
|
||||||
self.nr_blocks
|
self.nr_blocks
|
||||||
|
@ -6,8 +6,9 @@ use std::collections::HashSet;
|
|||||||
use std::error::Error;
|
use std::error::Error;
|
||||||
use std::path::Path;
|
use std::path::Path;
|
||||||
use std::sync::{Arc, Mutex};
|
use std::sync::{Arc, Mutex};
|
||||||
use std::thread;
|
use std::thread::{self, spawn};
|
||||||
use std::time::{Duration, Instant};
|
use std::time::{Duration, Instant};
|
||||||
|
use threadpool::ThreadPool;
|
||||||
|
|
||||||
use crate::block_manager::{AsyncIoEngine, Block, IoEngine, SyncIoEngine, BLOCK_SIZE};
|
use crate::block_manager::{AsyncIoEngine, Block, IoEngine, SyncIoEngine, BLOCK_SIZE};
|
||||||
use crate::checksum;
|
use crate::checksum;
|
||||||
@ -140,19 +141,22 @@ impl ValueType for ValueU64 {
|
|||||||
//------------------------------------------
|
//------------------------------------------
|
||||||
|
|
||||||
trait NodeVisitor<V: ValueType> {
|
trait NodeVisitor<V: ValueType> {
|
||||||
fn visit<'a>(&mut self, w: &mut BTreeWalker<'a>, b: &Block, node: &Node<V>) -> Result<()>;
|
fn visit<'a>(&mut self, w: &BTreeWalker, b: &Block, node: &Node<V>) -> Result<()>;
|
||||||
}
|
}
|
||||||
|
|
||||||
struct BTreeWalker<'a> {
|
#[derive(Clone)]
|
||||||
engine: &'a mut dyn IoEngine,
|
struct BTreeWalker {
|
||||||
seen: &'a mut FixedBitSet,
|
engine: Arc<Mutex<AsyncIoEngine>>,
|
||||||
|
seen: Arc<Mutex<FixedBitSet>>,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl<'a> BTreeWalker<'a> {
|
impl BTreeWalker {
|
||||||
fn new(engine: &'a mut dyn IoEngine, seen: &'a mut FixedBitSet) -> BTreeWalker<'a> {
|
fn new(engine: AsyncIoEngine) -> BTreeWalker {
|
||||||
let nr_blocks = engine.get_nr_blocks() as usize;
|
let nr_blocks = engine.get_nr_blocks() as usize;
|
||||||
assert_eq!(seen.len(), nr_blocks);
|
let r: BTreeWalker = BTreeWalker {
|
||||||
let r: BTreeWalker<'a> = BTreeWalker { engine, seen };
|
engine: Arc::new(Mutex::new(engine)),
|
||||||
|
seen: Arc::new(Mutex::new(FixedBitSet::with_capacity(nr_blocks))),
|
||||||
|
};
|
||||||
r
|
r
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -162,13 +166,17 @@ impl<'a> BTreeWalker<'a> {
|
|||||||
V: ValueType,
|
V: ValueType,
|
||||||
{
|
{
|
||||||
let mut blocks = Vec::new();
|
let mut blocks = Vec::new();
|
||||||
|
let seen = self.seen.lock().unwrap();
|
||||||
for b in bs {
|
for b in bs {
|
||||||
if !self.seen[*b as usize] {
|
if !seen[*b as usize] {
|
||||||
blocks.push(Block::new(*b));
|
blocks.push(Block::new(*b));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
drop(seen);
|
||||||
|
|
||||||
self.engine.read_many(&mut blocks)?;
|
let mut engine = self.engine.lock().unwrap();
|
||||||
|
engine.read_many(&mut blocks)?;
|
||||||
|
drop(engine);
|
||||||
|
|
||||||
for b in blocks {
|
for b in blocks {
|
||||||
self.walk_node(visitor, &b)?;
|
self.walk_node(visitor, &b)?;
|
||||||
@ -182,7 +190,9 @@ impl<'a> BTreeWalker<'a> {
|
|||||||
NV: NodeVisitor<V>,
|
NV: NodeVisitor<V>,
|
||||||
V: ValueType,
|
V: ValueType,
|
||||||
{
|
{
|
||||||
self.seen.insert(b.loc as usize);
|
let mut seen = self.seen.lock().unwrap();
|
||||||
|
seen.insert(b.loc as usize);
|
||||||
|
drop(seen);
|
||||||
|
|
||||||
let bt = checksum::metadata_block_type(b.get_data());
|
let bt = checksum::metadata_block_type(b.get_data());
|
||||||
if bt != checksum::BT::NODE {
|
if bt != checksum::BT::NODE {
|
||||||
@ -234,16 +244,49 @@ impl ValueType for ValueBlockTime {
|
|||||||
struct TopLevelVisitor {}
|
struct TopLevelVisitor {}
|
||||||
|
|
||||||
impl NodeVisitor<ValueU64> for TopLevelVisitor {
|
impl NodeVisitor<ValueU64> for TopLevelVisitor {
|
||||||
fn visit(&mut self, w: &mut BTreeWalker, _b: &Block, node: &Node<ValueU64>) -> Result<()> {
|
fn visit(&mut self, w: &BTreeWalker, _b: &Block, node: &Node<ValueU64>) -> Result<()> {
|
||||||
if let Node::Leaf {
|
if let Node::Leaf {
|
||||||
header: _h,
|
header: _h,
|
||||||
keys,
|
keys,
|
||||||
values,
|
values,
|
||||||
} = node
|
} = node
|
||||||
{
|
{
|
||||||
let mut v = BottomLevelVisitor {};
|
let mut blocks = Vec::new();
|
||||||
w.walk_nodes(&mut v, values)?;
|
let mut thin_ids = Vec::new();
|
||||||
|
let seen = w.seen.lock().unwrap();
|
||||||
|
for n in 0..keys.len() {
|
||||||
|
let b = values[n];
|
||||||
|
if !seen[b as usize] {
|
||||||
|
thin_ids.push(keys[n]);
|
||||||
|
blocks.push(Block::new(b));
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
drop(seen);
|
||||||
|
|
||||||
|
let mut engine = w.engine.lock().unwrap();
|
||||||
|
engine.read_many(&mut blocks)?;
|
||||||
|
drop(engine);
|
||||||
|
|
||||||
|
// FIXME: with a thread pool we need to return errors another way.
|
||||||
|
let nr_workers = 16;
|
||||||
|
let pool = ThreadPool::new(nr_workers);
|
||||||
|
|
||||||
|
let mut n = 0;
|
||||||
|
for b in blocks {
|
||||||
|
let thin_id = thin_ids[n];
|
||||||
|
n += 1;
|
||||||
|
|
||||||
|
let mut w = w.clone();
|
||||||
|
pool.execute(move || {
|
||||||
|
let mut v = BottomLevelVisitor {};
|
||||||
|
w.walk_node(&mut v, &b);
|
||||||
|
eprintln!("checked thin_dev {}", thin_id);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
pool.join();
|
||||||
|
}
|
||||||
|
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -251,12 +294,7 @@ impl NodeVisitor<ValueU64> for TopLevelVisitor {
|
|||||||
struct BottomLevelVisitor {}
|
struct BottomLevelVisitor {}
|
||||||
|
|
||||||
impl NodeVisitor<ValueBlockTime> for BottomLevelVisitor {
|
impl NodeVisitor<ValueBlockTime> for BottomLevelVisitor {
|
||||||
fn visit(
|
fn visit(&mut self, _w: &BTreeWalker, _b: &Block, _node: &Node<ValueBlockTime>) -> Result<()> {
|
||||||
&mut self,
|
|
||||||
_w: &mut BTreeWalker,
|
|
||||||
_b: &Block,
|
|
||||||
_node: &Node<ValueBlockTime>,
|
|
||||||
) -> Result<()> {
|
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -275,10 +313,12 @@ pub fn check(dev: &Path) -> Result<()> {
|
|||||||
engine.read(&mut root)?;
|
engine.read(&mut root)?;
|
||||||
|
|
||||||
let mut seen = FixedBitSet::with_capacity(engine.get_nr_blocks() as usize);
|
let mut seen = FixedBitSet::with_capacity(engine.get_nr_blocks() as usize);
|
||||||
let mut w = BTreeWalker::new(&mut engine, &mut seen);
|
let mut w = BTreeWalker::new(engine);
|
||||||
let mut visitor = TopLevelVisitor {};
|
let mut visitor = TopLevelVisitor {};
|
||||||
let result = w.walk_node(&mut visitor, &root)?;
|
let result = w.walk_node(&mut visitor, &root)?;
|
||||||
println!("read mapping tree in {} ms", now.elapsed().as_millis());
|
println!("read mapping tree in {} ms", now.elapsed().as_millis());
|
||||||
|
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
|
//------------------------------------------
|
||||||
|
Loading…
Reference in New Issue
Block a user