2022-01-11 12:59:39 +01:00
|
|
|
use std::path::{Path, PathBuf};
|
|
|
|
|
|
|
|
use futures::stream::{FuturesUnordered, StreamExt};
|
|
|
|
use ignore::{
|
|
|
|
gitignore::{Gitignore, GitignoreBuilder},
|
|
|
|
Match,
|
|
|
|
};
|
|
|
|
use tokio::fs::read_to_string;
|
|
|
|
use tracing::{trace, trace_span};
|
|
|
|
|
|
|
|
use crate::{
|
|
|
|
error::RuntimeError,
|
|
|
|
event::{Event, FileType},
|
|
|
|
filter::Filterer,
|
|
|
|
};
|
|
|
|
|
|
|
|
use super::files::IgnoreFile;
|
|
|
|
|
|
|
|
/// A path-only filterer dedicated to ignore files.
|
|
|
|
///
|
|
|
|
/// This reads and compiles ignore files, and should be used for handling ignore files. It's created
|
|
|
|
/// with a project origin and a list of ignore files, and new ignore files can be added later
|
|
|
|
/// (unless [`finish`](Filter::finish()) is called).
|
|
|
|
///
|
|
|
|
/// It implements [`Filterer`] so it can be used directly in another filterer; it is not designed to
|
|
|
|
/// be used as a standalone filterer.
|
|
|
|
#[derive(Debug)]
|
2022-01-15 03:12:32 +01:00
|
|
|
pub struct IgnoreFilterer {
|
2022-01-11 12:59:39 +01:00
|
|
|
origin: PathBuf,
|
|
|
|
builder: Option<GitignoreBuilder>,
|
|
|
|
compiled: Gitignore,
|
|
|
|
}
|
|
|
|
|
2022-01-15 03:12:32 +01:00
|
|
|
impl IgnoreFilterer {
|
2022-01-11 12:59:39 +01:00
|
|
|
/// Read ignore files from disk and load them for filtering.
|
|
|
|
pub async fn new(origin: impl AsRef<Path>, files: &[IgnoreFile]) -> Result<Self, RuntimeError> {
|
2022-01-15 11:46:06 +01:00
|
|
|
let origin = origin.as_ref();
|
|
|
|
let _span = trace_span!("build_filterer", ?origin);
|
|
|
|
|
|
|
|
trace!(files=%files.len(), "loading file contents");
|
2022-01-11 12:59:39 +01:00
|
|
|
let (files_contents, errors): (Vec<_>, Vec<_>) = files
|
|
|
|
.iter()
|
|
|
|
.map(|file| async move {
|
|
|
|
trace!(?file, "loading ignore file");
|
|
|
|
let content = read_to_string(&file.path).await.map_err(|err| {
|
|
|
|
RuntimeError::IgnoreFileRead {
|
|
|
|
file: file.path.clone(),
|
|
|
|
err,
|
|
|
|
}
|
|
|
|
})?;
|
|
|
|
Ok((file.clone(), content))
|
|
|
|
})
|
|
|
|
.collect::<FuturesUnordered<_>>()
|
|
|
|
.collect::<Vec<_>>()
|
|
|
|
.await
|
|
|
|
.into_iter()
|
|
|
|
.map(|res| match res {
|
|
|
|
Ok(o) => (Some(o), None),
|
|
|
|
Err(e) => (None, Some(e)),
|
|
|
|
})
|
|
|
|
.unzip();
|
|
|
|
|
|
|
|
let errors: Vec<RuntimeError> = errors.into_iter().flatten().collect();
|
|
|
|
if !errors.is_empty() {
|
2022-01-15 11:46:06 +01:00
|
|
|
trace!("found {} errors", errors.len());
|
2022-01-11 12:59:39 +01:00
|
|
|
return Err(RuntimeError::Set(errors));
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: different parser/adapter for non-git-syntax ignore files?
|
|
|
|
|
2022-01-15 11:46:06 +01:00
|
|
|
trace!(files=%files_contents.len(), "building ignore list");
|
2022-01-11 12:59:39 +01:00
|
|
|
let mut builder = GitignoreBuilder::new(origin);
|
|
|
|
for (file, content) in files_contents.into_iter().flatten() {
|
|
|
|
let _span = trace_span!("loading ignore file", ?file).entered();
|
|
|
|
for line in content.lines() {
|
|
|
|
if line.is_empty() || line.starts_with('#') {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
trace!(?line, "adding ignore line");
|
|
|
|
builder
|
|
|
|
.add_line(file.applies_in.clone(), line)
|
|
|
|
.map_err(|err| RuntimeError::IgnoreFileGlob {
|
|
|
|
file: file.path.clone(),
|
|
|
|
err,
|
|
|
|
})?;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
trace!("compiling globset");
|
|
|
|
let compiled = builder
|
|
|
|
.build()
|
|
|
|
.map_err(|err| RuntimeError::IgnoreFileGlob {
|
|
|
|
file: "set of ignores".into(),
|
|
|
|
err,
|
|
|
|
})?;
|
|
|
|
|
|
|
|
trace!(
|
|
|
|
files=%files.len(),
|
|
|
|
ignores=%compiled.num_ignores(),
|
|
|
|
allows=%compiled.num_whitelists(),
|
|
|
|
"ignore files loaded and compiled",
|
|
|
|
);
|
|
|
|
|
|
|
|
Ok(Self {
|
|
|
|
origin: origin.to_owned(),
|
|
|
|
builder: Some(builder),
|
|
|
|
compiled,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Deletes the internal builder, to save memory.
|
|
|
|
///
|
|
|
|
/// This makes it impossible to add new ignore files without re-compiling the whole set.
|
|
|
|
pub fn finish(&mut self) {
|
|
|
|
self.builder = None;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Reads and adds an ignore file, if the builder is available.
|
|
|
|
///
|
|
|
|
/// Does nothing silently otherwise.
|
|
|
|
pub async fn add_file(&mut self, file: &IgnoreFile) -> Result<(), RuntimeError> {
|
|
|
|
if let Some(ref mut builder) = self.builder {
|
|
|
|
trace!(?file, "reading ignore file");
|
|
|
|
let content =
|
|
|
|
read_to_string(&file.path)
|
|
|
|
.await
|
|
|
|
.map_err(|err| RuntimeError::IgnoreFileRead {
|
|
|
|
file: file.path.clone(),
|
|
|
|
err,
|
|
|
|
})?;
|
|
|
|
|
|
|
|
let _span = trace_span!("loading ignore file", ?file).entered();
|
|
|
|
for line in content.lines() {
|
|
|
|
if line.is_empty() || line.starts_with('#') {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
trace!(?line, "adding ignore line");
|
|
|
|
builder
|
|
|
|
.add_line(file.applies_in.clone(), line)
|
|
|
|
.map_err(|err| RuntimeError::IgnoreFileGlob {
|
|
|
|
file: file.path.clone(),
|
|
|
|
err,
|
|
|
|
})?;
|
|
|
|
}
|
|
|
|
|
2022-01-15 14:36:22 +01:00
|
|
|
self.recompile(file.path.clone())?;
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
fn recompile(&mut self, file: PathBuf) -> Result<(), RuntimeError> {
|
|
|
|
if let Some(builder) = &mut self.builder {
|
2022-01-11 12:59:39 +01:00
|
|
|
let pre_ignores = self.compiled.num_ignores();
|
|
|
|
let pre_allows = self.compiled.num_whitelists();
|
|
|
|
|
|
|
|
trace!("recompiling globset");
|
|
|
|
let recompiled = builder
|
|
|
|
.build()
|
|
|
|
.map_err(|err| RuntimeError::IgnoreFileGlob {
|
2022-01-15 14:36:22 +01:00
|
|
|
file,
|
2022-01-11 12:59:39 +01:00
|
|
|
err,
|
|
|
|
})?;
|
|
|
|
|
|
|
|
trace!(
|
|
|
|
new_ignores=%(recompiled.num_ignores() - pre_ignores),
|
|
|
|
new_allows=%(recompiled.num_whitelists() - pre_allows),
|
|
|
|
"ignore file loaded and set recompiled",
|
|
|
|
);
|
|
|
|
self.compiled = recompiled;
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
2022-01-15 14:36:22 +01:00
|
|
|
/// Adds some globs manually, if the builder is available.
|
|
|
|
///
|
|
|
|
/// Does nothing silently otherwise.
|
|
|
|
pub async fn add_globs(&mut self, globs: &[&str], applies_in: Option<PathBuf>) -> Result<(), RuntimeError> {
|
|
|
|
if let Some(ref mut builder) = self.builder {
|
|
|
|
let _span = trace_span!("loading ignore globs", ?globs).entered();
|
|
|
|
for line in globs {
|
|
|
|
if line.is_empty() || line.starts_with('#') {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
trace!(?line, "adding ignore line");
|
|
|
|
builder
|
|
|
|
.add_line(applies_in.clone(), line)
|
|
|
|
.map_err(|err| RuntimeError::IgnoreFileGlob {
|
|
|
|
file: "manual glob".into(),
|
|
|
|
err,
|
|
|
|
})?;
|
|
|
|
}
|
|
|
|
|
|
|
|
self.recompile("manual glob".into())?;
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
2022-01-11 12:59:39 +01:00
|
|
|
/// Check a particular folder path against the ignore set.
|
|
|
|
///
|
|
|
|
/// Returns `false` if the folder should be ignored.
|
|
|
|
///
|
|
|
|
/// Note that this is a slightly different implementation than the [`Filterer`] trait, as the
|
|
|
|
/// latter handles events with multiple associated paths.
|
|
|
|
pub fn check_dir(&self, path: &Path) -> bool {
|
|
|
|
let _span = trace_span!("check_dir", ?path).entered();
|
|
|
|
|
|
|
|
trace!("checking against compiled ignore files");
|
|
|
|
match if path.strip_prefix(&self.origin).is_ok() {
|
|
|
|
trace!("checking against path or parents");
|
|
|
|
self.compiled.matched_path_or_any_parents(path, true)
|
|
|
|
} else {
|
|
|
|
trace!("checking against path only");
|
|
|
|
self.compiled.matched(path, true)
|
|
|
|
} {
|
|
|
|
Match::None => {
|
|
|
|
trace!("no match (pass)");
|
|
|
|
true
|
|
|
|
}
|
|
|
|
Match::Ignore(glob) => {
|
|
|
|
if glob.from().map_or(true, |f| path.strip_prefix(f).is_ok()) {
|
|
|
|
trace!(?glob, "positive match (fail)");
|
|
|
|
false
|
|
|
|
} else {
|
|
|
|
trace!(?glob, "positive match, but not in scope (pass)");
|
|
|
|
true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Match::Whitelist(glob) => {
|
|
|
|
trace!(?glob, "negative match (pass)");
|
|
|
|
true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-15 03:12:32 +01:00
|
|
|
impl Filterer for IgnoreFilterer {
|
2022-01-11 12:59:39 +01:00
|
|
|
/// Filter an event.
|
|
|
|
///
|
|
|
|
/// This implementation never errors. It returns `Ok(false)` if the event is ignored according
|
|
|
|
/// to the ignore files, and `Ok(true)` otherwise.
|
|
|
|
fn check_event(&self, event: &Event) -> Result<bool, RuntimeError> {
|
|
|
|
let _span = trace_span!("filterer_check").entered();
|
|
|
|
let mut pass = true;
|
|
|
|
|
|
|
|
for (path, file_type) in event.paths() {
|
2022-01-15 11:46:06 +01:00
|
|
|
let _span = trace_span!("checking_against_compiled", ?path, ?file_type).entered();
|
2022-01-11 12:59:39 +01:00
|
|
|
let is_dir = file_type
|
|
|
|
.map(|t| matches!(t, FileType::Dir))
|
|
|
|
.unwrap_or(false);
|
|
|
|
|
|
|
|
match if path.strip_prefix(&self.origin).is_ok() {
|
|
|
|
trace!("checking against path or parents");
|
|
|
|
self.compiled.matched_path_or_any_parents(path, is_dir)
|
|
|
|
} else {
|
|
|
|
trace!("checking against path only");
|
|
|
|
self.compiled.matched(path, is_dir)
|
|
|
|
} {
|
|
|
|
Match::None => {
|
|
|
|
trace!("no match (pass)");
|
|
|
|
pass &= true;
|
|
|
|
}
|
|
|
|
Match::Ignore(glob) => {
|
|
|
|
if glob.from().map_or(true, |f| path.strip_prefix(f).is_ok()) {
|
|
|
|
trace!(?glob, "positive match (fail)");
|
|
|
|
pass &= false;
|
|
|
|
} else {
|
|
|
|
trace!(?glob, "positive match, but not in scope (ignore)");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Match::Whitelist(glob) => {
|
|
|
|
trace!(?glob, "negative match (pass)");
|
|
|
|
pass = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
trace!(?pass, "verdict");
|
|
|
|
Ok(pass)
|
|
|
|
}
|
|
|
|
}
|