2020-02-06 01:01:44 +01:00
|
|
|
use crate::common::*;
|
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
/// File names treated as junk: `Walker::files` skips any file whose name
/// appears in this list unless `include_junk` is set.
// NOTE(review): presumably OS-generated metadata files — confirm before extending the list.
const JUNK: &[&str] = &["Thumbs.db", "Desktop.ini"];
|
|
|
|
|
2020-02-06 06:47:12 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
struct Pattern {
|
|
|
|
glob: GlobMatcher,
|
|
|
|
include: bool,
|
|
|
|
}
|
|
|
|
|
2020-02-06 01:01:44 +01:00
|
|
|
pub(crate) struct Walker {
|
2020-02-06 03:32:09 +01:00
|
|
|
follow_symlinks: bool,
|
2020-02-06 01:01:44 +01:00
|
|
|
include_hidden: bool,
|
2020-02-06 03:32:09 +01:00
|
|
|
include_junk: bool,
|
2020-03-26 02:08:55 +01:00
|
|
|
file_order: FileOrder,
|
2020-02-06 06:47:12 +01:00
|
|
|
patterns: Vec<Pattern>,
|
2020-02-06 01:01:44 +01:00
|
|
|
root: PathBuf,
|
2020-03-12 00:04:22 +01:00
|
|
|
spinner: Option<ProgressBar>,
|
2020-02-06 01:01:44 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Walker {
|
2020-03-12 00:04:22 +01:00
|
|
|
pub(crate) fn new(root: &Path) -> Self {
|
|
|
|
Self {
|
2020-02-06 03:32:09 +01:00
|
|
|
follow_symlinks: false,
|
2020-02-06 01:01:44 +01:00
|
|
|
include_hidden: false,
|
2020-02-06 03:32:09 +01:00
|
|
|
include_junk: false,
|
2020-03-26 02:08:55 +01:00
|
|
|
file_order: FileOrder::AlphabeticalAsc,
|
2020-02-06 06:47:12 +01:00
|
|
|
patterns: Vec::new(),
|
2020-02-06 01:01:44 +01:00
|
|
|
root: root.to_owned(),
|
2020-03-12 00:04:22 +01:00
|
|
|
spinner: None,
|
2020-02-06 01:01:44 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
/// Set whether files whose name is listed in `JUNK` are kept by `files`.
pub(crate) fn include_junk(mut self, include_junk: bool) -> Self {
    self.include_junk = include_junk;
    self
}
|
|
|
|
|
|
|
|
/// Set whether hidden entries are kept by `files`.
///
/// When `false`, entries whose name starts with `.` and entries that
/// `Platform::hidden` reports as hidden are skipped.
pub(crate) fn include_hidden(mut self, include_hidden: bool) -> Self {
    self.include_hidden = include_hidden;
    self
}
|
|
|
|
|
2020-03-26 02:08:55 +01:00
|
|
|
/// Set the ordering used by `files` to sort the collected files.
pub(crate) fn file_order(mut self, file_order: FileOrder) -> Self {
    self.file_order = file_order;
    self
}
|
|
|
|
|
2020-02-06 06:47:12 +01:00
|
|
|
pub(crate) fn globs(mut self, globs: &[String]) -> Result<Self, Error> {
|
|
|
|
for glob in globs {
|
|
|
|
let exclude = glob.starts_with('!');
|
|
|
|
let glob = Glob::new(if exclude { &glob[1..] } else { glob })?.compile_matcher();
|
|
|
|
self.patterns.push(Pattern {
|
|
|
|
glob,
|
|
|
|
include: !exclude,
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(self)
|
|
|
|
}
|
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
/// Set whether symbolic links are followed during the walk.
///
/// The value is forwarded to `WalkDir::follow_links`; when `false`, `files`
/// also rejects a root that is itself a symlink.
pub(crate) fn follow_symlinks(mut self, follow_symlinks: bool) -> Self {
    self.follow_symlinks = follow_symlinks;
    self
}
|
|
|
|
|
2020-03-12 09:08:40 +01:00
|
|
|
/// Attach (or detach, with `None`) a progress indicator.
///
/// During `files`, the indicator's message is set to each visited path and
/// it is ticked once per entry.
pub(crate) fn spinner(mut self, spinner: Option<ProgressBar>) -> Self {
    self.spinner = spinner;
    self
}
|
|
|
|
|
2020-02-06 01:01:44 +01:00
|
|
|
pub(crate) fn files(self) -> Result<Files, Error> {
|
2020-02-06 03:32:09 +01:00
|
|
|
if !self.follow_symlinks
|
|
|
|
&& self
|
|
|
|
.root
|
|
|
|
.symlink_metadata()
|
|
|
|
.context(error::Filesystem { path: &self.root })?
|
|
|
|
.file_type()
|
|
|
|
.is_symlink()
|
|
|
|
{
|
|
|
|
return Err(Error::SymlinkRoot { root: self.root });
|
|
|
|
}
|
2020-02-06 01:01:44 +01:00
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
let root_metadata = self
|
|
|
|
.root
|
|
|
|
.metadata()
|
|
|
|
.context(error::Filesystem { path: &self.root })?;
|
2020-02-06 01:01:44 +01:00
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
if root_metadata.is_file() {
|
|
|
|
return Ok(Files::file(self.root, Bytes::from(root_metadata.len())));
|
|
|
|
}
|
2020-02-06 01:01:44 +01:00
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
let filter = |entry: &walkdir::DirEntry| {
|
2020-02-06 01:01:44 +01:00
|
|
|
let path = entry.path();
|
|
|
|
|
2020-03-12 00:04:22 +01:00
|
|
|
if let Some(s) = &self.spinner {
|
|
|
|
let display_path = path.strip_prefix(&self.root).unwrap_or(&path);
|
|
|
|
s.set_message(&display_path.display().to_string());
|
|
|
|
s.tick();
|
|
|
|
}
|
|
|
|
|
2020-02-06 01:01:44 +01:00
|
|
|
let file_name = entry.file_name();
|
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
if !self.include_hidden && file_name.to_string_lossy().starts_with('.') {
|
|
|
|
return false;
|
2020-02-06 01:01:44 +01:00
|
|
|
}
|
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
let hidden = Platform::hidden(path).unwrap_or(true);
|
|
|
|
|
|
|
|
if !self.include_hidden && hidden {
|
|
|
|
return false;
|
2020-02-06 01:01:44 +01:00
|
|
|
}
|
|
|
|
|
2020-02-06 03:32:09 +01:00
|
|
|
true
|
|
|
|
};
|
|
|
|
|
2020-03-26 02:08:55 +01:00
|
|
|
let mut file_infos = Vec::new();
|
2020-02-06 03:32:09 +01:00
|
|
|
let mut total_size = 0;
|
|
|
|
for result in WalkDir::new(&self.root)
|
|
|
|
.follow_links(self.follow_symlinks)
|
|
|
|
.into_iter()
|
|
|
|
.filter_entry(filter)
|
|
|
|
{
|
|
|
|
let entry = result?;
|
|
|
|
|
|
|
|
let path = entry.path();
|
|
|
|
|
|
|
|
let metadata = entry.metadata()?;
|
|
|
|
|
|
|
|
if !metadata.is_file() {
|
2020-02-06 01:01:44 +01:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2020-02-06 06:47:12 +01:00
|
|
|
let relative = path
|
|
|
|
.strip_prefix(&self.root)
|
|
|
|
.context(error::PathStripPrefix {
|
|
|
|
path,
|
|
|
|
prefix: &self.root,
|
|
|
|
})?;
|
|
|
|
|
|
|
|
if relative.components().count() == 0 {
|
|
|
|
return Err(Error::PathStripEmpty {
|
|
|
|
prefix: self.root.clone(),
|
|
|
|
path: path.to_owned(),
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
if !self.pattern_filter(&relative) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
let file_path = FilePath::from_relative_path(relative)?;
|
2020-02-06 03:32:09 +01:00
|
|
|
|
|
|
|
if !self.include_junk && JUNK.contains(&file_path.name()) {
|
2020-02-06 01:01:44 +01:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2020-03-26 02:08:55 +01:00
|
|
|
let len = metadata.len();
|
|
|
|
total_size += len;
|
2020-02-06 03:32:09 +01:00
|
|
|
|
2020-03-26 02:08:55 +01:00
|
|
|
file_infos.push(FileInfo {
|
|
|
|
path: file_path,
|
|
|
|
length: Bytes(len),
|
|
|
|
md5sum: None,
|
|
|
|
});
|
2020-02-06 01:01:44 +01:00
|
|
|
}
|
|
|
|
|
2020-03-26 02:08:55 +01:00
|
|
|
file_infos.sort_by(|a, b| self.file_order.compare_file_info(a, b));
|
|
|
|
|
|
|
|
Ok(Files::dir(
|
|
|
|
self.root,
|
|
|
|
Bytes::from(total_size),
|
|
|
|
file_infos
|
|
|
|
.into_iter()
|
|
|
|
.map(|file_info| file_info.path)
|
|
|
|
.collect(),
|
|
|
|
))
|
2020-02-06 01:01:44 +01:00
|
|
|
}
|
2020-02-06 06:47:12 +01:00
|
|
|
|
|
|
|
fn pattern_filter(&self, relative: &Path) -> bool {
|
|
|
|
for Pattern { glob, include } in self.patterns.iter().rev() {
|
|
|
|
if glob.is_match(relative) {
|
|
|
|
return *include;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if let Some(Pattern { include, .. }) = self.patterns.first() {
|
|
|
|
return !include;
|
|
|
|
}
|
|
|
|
|
|
|
|
true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
mod tests {
    use super::*;

    /// A single include glob keeps matching paths and rejects the rest.
    #[test]
    fn glob() {
        let patterns = ["[bc]".to_owned()];
        let walker = Walker::new(Path::new("foo")).globs(&patterns).unwrap();

        assert!(!walker.pattern_filter(Path::new("a")));

        for included in &["b", "c"] {
            assert!(walker.pattern_filter(Path::new(included)));
        }
    }
}
|