From 9c44a4d08fb357db60a49ca260e5321d520a5d75 Mon Sep 17 00:00:00 2001 From: Antioch Peverell Date: Tue, 23 Feb 2021 11:40:26 +0000 Subject: [PATCH] Refactor prune file replace (#3571) * split prune file rewrite into two steps only one needs a mut ref to self * write both tmp files then replace --- store/src/pmmr.rs | 22 ++++++++++------ store/src/types.rs | 62 +++++++++++++++++++++++++++------------------- 2 files changed, 51 insertions(+), 33 deletions(-) diff --git a/store/src/pmmr.rs b/store/src/pmmr.rs index 269afbb11..908d59b8e 100644 --- a/store/src/pmmr.rs +++ b/store/src/pmmr.rs @@ -352,17 +352,17 @@ impl PMMRBackend { // on the cutoff_pos provided. let (leaves_removed, pos_to_rm) = self.pos_to_rm(cutoff_pos, rewind_rm_pos); - // 1. Save compact copy of the hash file, skipping removed data. + // Save compact copy of the hash file, skipping removed data. { let pos_to_rm = map_vec!(pos_to_rm, |pos| { let shift = self.prune_list.get_shift(pos.into()); pos as u64 - shift }); - self.hash_file.save_prune(&pos_to_rm)?; + self.hash_file.write_tmp_pruned(&pos_to_rm)?; } - // 2. Save compact copy of the data file, skipping removed leaves. + // Save compact copy of the data file, skipping removed leaves. { let leaf_pos_to_rm = pos_to_rm .iter() @@ -376,10 +376,19 @@ impl PMMRBackend { flat_pos - shift }); - self.data_file.save_prune(&pos_to_rm)?; + self.data_file.write_tmp_pruned(&pos_to_rm)?; } - // 3. Update the prune list and write to disk. + // Replace hash and data files with compact copies. + // Rebuild and intialize from the new files. + { + debug!("compact: about to replace hash and data files and rebuild..."); + self.hash_file.replace_with_tmp()?; + self.data_file.replace_with_tmp()?; + debug!("compact: ...finished replacing and rebuilding"); + } + + // Update the prune list and write to disk. { for pos in leaves_removed.iter() { self.prune_list.add(pos.into()); @@ -387,11 +396,10 @@ impl PMMRBackend { self.prune_list.flush()?; } - // 4. Write the leaf_set to disk. + // Write the leaf_set to disk. // Optimize the bitmap storage in the process. self.leaf_set.flush()?; - // 5. cleanup rewind files self.clean_rewind_files()?; Ok(true) diff --git a/store/src/types.rs b/store/src/types.rs index df21a1719..4fd8105be 100644 --- a/store/src/types.rs +++ b/store/src/types.rs @@ -154,10 +154,16 @@ where } /// Write the file out to disk, pruning removed elements. - pub fn save_prune(&mut self, prune_pos: &[u64]) -> io::Result<()> { + pub fn write_tmp_pruned(&self, prune_pos: &[u64]) -> io::Result<()> { // Need to convert from 1-index to 0-index (don't ask). let prune_idx: Vec<_> = prune_pos.iter().map(|x| x - 1).collect(); - self.file.save_prune(prune_idx.as_slice()) + self.file.write_tmp_pruned(prune_idx.as_slice()) + } + + /// Replace with file at tmp path. + /// Rebuild and initialize from new file. + pub fn replace_with_tmp(&mut self) -> io::Result<()> { + self.file.replace_with_tmp() } } @@ -485,39 +491,43 @@ where Ok(file) } + fn tmp_path(&self) -> PathBuf { + self.path.with_extension("tmp") + } + /// Saves a copy of the current file content, skipping data at the provided /// prune positions. prune_pos must be ordered. - pub fn save_prune(&mut self, prune_pos: &[u64]) -> io::Result<()> { - let tmp_path = self.path.with_extension("tmp"); + pub fn write_tmp_pruned(&self, prune_pos: &[u64]) -> io::Result<()> { + let reader = File::open(&self.path)?; + let mut buf_reader = BufReader::new(reader); + let mut streaming_reader = StreamingReader::new(&mut buf_reader, self.version); - // Scope the reader and writer to within the block so we can safely replace files later on. - { - let reader = File::open(&self.path)?; - let mut buf_reader = BufReader::new(reader); - let mut streaming_reader = StreamingReader::new(&mut buf_reader, self.version); + let mut buf_writer = BufWriter::new(File::create(&self.tmp_path())?); + let mut bin_writer = BinWriter::new(&mut buf_writer, self.version); - let mut buf_writer = BufWriter::new(File::create(&tmp_path)?); - let mut bin_writer = BinWriter::new(&mut buf_writer, self.version); - - let mut current_pos = 0; - let mut prune_pos = prune_pos; - while let Ok(elmt) = T::read(&mut streaming_reader) { - if prune_pos.contains(¤t_pos) { - // Pruned pos, moving on. - prune_pos = &prune_pos[1..]; - } else { - // Not pruned, write to file. - elmt.write(&mut bin_writer) - .map_err(|e| io::Error::new(io::ErrorKind::Other, e))?; - } - current_pos += 1; + let mut current_pos = 0; + let mut prune_pos = prune_pos; + while let Ok(elmt) = T::read(&mut streaming_reader) { + if prune_pos.contains(¤t_pos) { + // Pruned pos, moving on. + prune_pos = &prune_pos[1..]; + } else { + // Not pruned, write to file. + elmt.write(&mut bin_writer) + .map_err(|e| io::Error::new(io::ErrorKind::Other, e))?; } - buf_writer.flush()?; + current_pos += 1; } + buf_writer.flush()?; + Ok(()) + } + /// Replace the underlying file with the file at tmp path. + /// Rebuild and initialize from the new file. + pub fn replace_with_tmp(&mut self) -> io::Result<()> { // Replace the underlying file - // pmmr_data.tmp -> pmmr_data.bin - self.replace(&tmp_path)?; + self.replace(&self.tmp_path())?; // Now rebuild our size file to reflect the pruned data file. // This will replace the underlying file internally.