// intermodal/src/hasher.rs
use crate::common::*;
pub(crate) struct Hasher {
buffer: Vec<u8>,
length: u64,
md5sum: bool,
piece_bytes_hashed: usize,
piece_length: usize,
pieces: PieceList,
2019-05-24 01:25:55 -07:00
sha1: Sha1,
progress_bar: Option<ProgressBar>,
2019-05-24 01:25:55 -07:00
}
impl Hasher {
pub(crate) fn new(md5sum: bool, piece_length: usize, progress_bar: Option<ProgressBar>) -> Self {
Self {
buffer: vec![0; piece_length],
2019-05-24 01:25:55 -07:00
length: 0,
piece_bytes_hashed: 0,
pieces: PieceList::new(),
2019-05-24 01:25:55 -07:00
sha1: Sha1::new(),
piece_length,
md5sum,
progress_bar,
2019-05-24 01:25:55 -07:00
}
}
pub(crate) fn hash_files(mut self, files: &Files) -> Result<(Mode, PieceList), Error> {
let mode = if let Some(contents) = files.contents() {
let files = self.hash_contents(&files.root(), contents)?;
2019-05-24 01:25:55 -07:00
Mode::Multiple { files }
2019-05-24 01:25:55 -07:00
} else {
let (md5sum, length) = self.hash_file(files.root())?;
2019-05-24 01:25:55 -07:00
Mode::Single { md5sum, length }
};
2019-05-24 01:25:55 -07:00
self.finish();
Ok((mode, self.pieces))
}
pub(crate) fn hash_stdin(mut self, stdin: &mut dyn BufRead) -> Result<(Mode, PieceList), Error> {
let (md5sum, length) = self.hash_read_io(stdin).context(error::Stdin)?;
let mode = Mode::Single { md5sum, length };
self.finish();
Ok((mode, self.pieces))
}
fn finish(&mut self) {
if self.piece_bytes_hashed > 0 {
self.pieces.push(self.sha1.digest().into());
self.sha1.reset();
self.piece_bytes_hashed = 0;
2019-05-24 01:25:55 -07:00
}
}
fn hash_contents(
&mut self,
root: &Path,
file_paths: &[FilePath],
) -> Result<Vec<FileInfo>, Error> {
let mut files = Vec::new();
for file_path in file_paths {
let path = file_path.absolute(root);
let (md5sum, length) = self.hash_file(&path)?;
files.push(FileInfo {
path: file_path.clone(),
md5sum,
length,
});
2019-05-24 01:25:55 -07:00
}
Ok(files)
2019-05-24 01:25:55 -07:00
}
fn hash_file(&mut self, path: &Path) -> Result<(Option<Md5Digest>, Bytes), Error> {
let file = File::open(path).context(error::Filesystem { path })?;
2019-05-24 01:25:55 -07:00
self
.hash_read_io(&mut BufReader::new(file))
.context(error::Filesystem { path })
2019-05-24 01:25:55 -07:00
}
fn hash_read_io(&mut self, file: &mut dyn BufRead) -> io::Result<(Option<Md5Digest>, Bytes)> {
let buffer_len = self.buffer.len();
let mut bytes_hashed = 0;
2019-05-24 01:25:55 -07:00
let mut md5 = if self.md5sum {
Some(md5::Context::new())
} else {
None
};
loop {
let buffer = &mut self.buffer[..buffer_len];
let bytes_read = file.read(buffer)?;
if bytes_read == 0 {
break;
}
2019-05-24 01:25:55 -07:00
bytes_hashed += bytes_read;
2019-05-24 01:25:55 -07:00
let read = &buffer[0..bytes_read];
for byte in read.iter().cloned() {
2019-05-24 01:25:55 -07:00
self.sha1.update(&[byte]);
self.piece_bytes_hashed += 1;
if self.piece_bytes_hashed == self.piece_length {
self.pieces.push(self.sha1.digest().into());
2019-05-24 01:25:55 -07:00
self.sha1.reset();
self.piece_bytes_hashed = 0;
}
}
if let Some(md5) = md5.as_mut() {
md5.consume(read);
2019-05-24 01:25:55 -07:00
}
if let Some(progress_bar) = &self.progress_bar {
progress_bar.inc(bytes_read.into_u64());
}
2019-05-24 01:25:55 -07:00
}
self.length += bytes_hashed.into_u64();
2019-05-24 01:25:55 -07:00
Ok((
md5.map(|context| context.compute().into()),
Bytes::from(bytes_hashed.into_u64()),
))
2019-05-24 01:25:55 -07:00
}
}