Skip to content

Commit

Permalink
Refactor prune file replace (#3571)
Browse files Browse the repository at this point in the history
* split prune file rewrite into two steps
only one needs a mut ref to self

* write both tmp files then replace
  • Loading branch information
antiochp authored Feb 23, 2021
1 parent a3c9b47 commit 9c44a4d
Show file tree
Hide file tree
Showing 2 changed files with 53 additions and 35 deletions.
22 changes: 15 additions & 7 deletions store/src/pmmr.rs
Original file line number Diff line number Diff line change
Expand Up @@ -352,17 +352,17 @@ impl<T: PMMRable> PMMRBackend<T> {
// on the cutoff_pos provided.
let (leaves_removed, pos_to_rm) = self.pos_to_rm(cutoff_pos, rewind_rm_pos);

// 1. Save compact copy of the hash file, skipping removed data.
// Save compact copy of the hash file, skipping removed data.
{
let pos_to_rm = map_vec!(pos_to_rm, |pos| {
let shift = self.prune_list.get_shift(pos.into());
pos as u64 - shift
});

self.hash_file.save_prune(&pos_to_rm)?;
self.hash_file.write_tmp_pruned(&pos_to_rm)?;
}

// 2. Save compact copy of the data file, skipping removed leaves.
// Save compact copy of the data file, skipping removed leaves.
{
let leaf_pos_to_rm = pos_to_rm
.iter()
Expand All @@ -376,22 +376,30 @@ impl<T: PMMRable> PMMRBackend<T> {
flat_pos - shift
});

self.data_file.save_prune(&pos_to_rm)?;
self.data_file.write_tmp_pruned(&pos_to_rm)?;
}

// 3. Update the prune list and write to disk.
// Replace hash and data files with compact copies.
// Rebuild and intialize from the new files.
{
debug!("compact: about to replace hash and data files and rebuild...");
self.hash_file.replace_with_tmp()?;
self.data_file.replace_with_tmp()?;
debug!("compact: ...finished replacing and rebuilding");
}

// Update the prune list and write to disk.
{
for pos in leaves_removed.iter() {
self.prune_list.add(pos.into());
}
self.prune_list.flush()?;
}

// 4. Write the leaf_set to disk.
// Write the leaf_set to disk.
// Optimize the bitmap storage in the process.
self.leaf_set.flush()?;

// 5. cleanup rewind files
self.clean_rewind_files()?;

Ok(true)
Expand Down
66 changes: 38 additions & 28 deletions store/src/types.rs
Original file line number Diff line number Diff line change
Expand Up @@ -154,10 +154,16 @@ where
}

/// Write the file out to disk, pruning removed elements.
pub fn save_prune(&mut self, prune_pos: &[u64]) -> io::Result<()> {
pub fn write_tmp_pruned(&self, prune_pos: &[u64]) -> io::Result<()> {
// Need to convert from 1-index to 0-index (don't ask).
let prune_idx: Vec<_> = prune_pos.iter().map(|x| x - 1).collect();
self.file.save_prune(prune_idx.as_slice())
self.file.write_tmp_pruned(prune_idx.as_slice())
}

/// Replace with file at tmp path.
/// Rebuild and initialize from new file.
pub fn replace_with_tmp(&mut self) -> io::Result<()> {
self.file.replace_with_tmp()
}
}

Expand Down Expand Up @@ -485,39 +491,43 @@ where
Ok(file)
}

fn tmp_path(&self) -> PathBuf {
self.path.with_extension("tmp")
}

/// Saves a copy of the current file content, skipping data at the provided
/// prune positions. prune_pos must be ordered.
pub fn save_prune(&mut self, prune_pos: &[u64]) -> io::Result<()> {
let tmp_path = self.path.with_extension("tmp");

// Scope the reader and writer to within the block so we can safely replace files later on.
{
let reader = File::open(&self.path)?;
let mut buf_reader = BufReader::new(reader);
let mut streaming_reader = StreamingReader::new(&mut buf_reader, self.version);

let mut buf_writer = BufWriter::new(File::create(&tmp_path)?);
let mut bin_writer = BinWriter::new(&mut buf_writer, self.version);

let mut current_pos = 0;
let mut prune_pos = prune_pos;
while let Ok(elmt) = T::read(&mut streaming_reader) {
if prune_pos.contains(&current_pos) {
// Pruned pos, moving on.
prune_pos = &prune_pos[1..];
} else {
// Not pruned, write to file.
elmt.write(&mut bin_writer)
.map_err(|e| io::Error::new(io::ErrorKind::Other, e))?;
}
current_pos += 1;
pub fn write_tmp_pruned(&self, prune_pos: &[u64]) -> io::Result<()> {
let reader = File::open(&self.path)?;
let mut buf_reader = BufReader::new(reader);
let mut streaming_reader = StreamingReader::new(&mut buf_reader, self.version);

let mut buf_writer = BufWriter::new(File::create(&self.tmp_path())?);
let mut bin_writer = BinWriter::new(&mut buf_writer, self.version);

let mut current_pos = 0;
let mut prune_pos = prune_pos;
while let Ok(elmt) = T::read(&mut streaming_reader) {
if prune_pos.contains(&current_pos) {
// Pruned pos, moving on.
prune_pos = &prune_pos[1..];
} else {
// Not pruned, write to file.
elmt.write(&mut bin_writer)
.map_err(|e| io::Error::new(io::ErrorKind::Other, e))?;
}
buf_writer.flush()?;
current_pos += 1;
}
buf_writer.flush()?;
Ok(())
}

/// Replace the underlying file with the file at tmp path.
/// Rebuild and initialize from the new file.
pub fn replace_with_tmp(&mut self) -> io::Result<()> {
// Replace the underlying file -
// pmmr_data.tmp -> pmmr_data.bin
self.replace(&tmp_path)?;
self.replace(&self.tmp_path())?;

// Now rebuild our size file to reflect the pruned data file.
// This will replace the underlying file internally.
Expand Down

0 comments on commit 9c44a4d

Please sign in to comment.