##// END OF EJS Templates
rust-revlog: add compression helpers...
rust-revlog: add compression helpers This will be used in the upcoming `InnerRevlog` when reading/writing data.

File last commit:

r53006:b2e90465 merge default
r53051:0744248c default
Show More
matchers.rs
2454 lines | 77.9 KiB | application/rls-services+xml | RustLexer
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 // matchers.rs
//
// Copyright 2019 Raphaël Gomès <rgomes@octobus.net>
//
// This software may be used and distributed according to the terms of the
// GNU General Public License version 2 or any later version.
//! Structs and types for matching files and directories.
Raphaël Gomès
rust-matchers: fix quadratic complexity in `FileMatcher`...
r52002 use format_bytes::format_bytes;
use once_cell::sync::OnceCell;
Raphaël Gomès
rust-matchers: add function to generate a regex matcher function...
r45006 use crate::{
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 dirstate::dirs_multiset::DirsChildrenMultiset,
filepatterns::{
build_single_regex, filter_subincludes, get_patterns_from_file,
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 PatternFileWarning, PatternResult,
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 },
utils::{
Arseniy Alekseyev
matchers: fix the bug in rust PatternMatcher that made it cut off early...
r52459 files::{dir_ancestors, find_dirs},
Spencer Baugh
rust: improve the type on DirsMultiset::from_manifest...
r51753 hg_path::{HgPath, HgPathBuf, HgPathError},
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 Escaped,
},
Spencer Baugh
rust: improve the type on DirsMultiset::from_manifest...
r51753 DirsMultiset, FastHashMap, IgnorePattern, PatternError, PatternSyntax,
Raphaël Gomès
rust-matchers: add function to generate a regex matcher function...
r45006 };
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009
Arseniy Alekseyev
rhg: refactor to use IgnoreFnType alias more widely...
r49177 use crate::dirstate::status::IgnoreFnType;
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 use crate::filepatterns::normalize_path_bytes;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 use std::collections::HashSet;
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 use std::fmt::{Display, Error, Formatter};
Raphaël Gomès
rust-status: only involve ignore mechanism when needed...
r45088 use std::path::{Path, PathBuf};
Raphaël Gomès
rust-matchers: fix quadratic complexity in `FileMatcher`...
r52002 use std::{borrow::ToOwned, collections::BTreeSet};
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828 #[derive(Debug, PartialEq)]
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 pub enum VisitChildrenSet {
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Don't visit anything
Empty,
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 /// Visit this directory and probably its children
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 This,
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 /// Only visit the children (both files and directories) if they
/// are mentioned in this set. (empty set corresponds to [Empty])
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// TODO Should we implement a `NonEmptyHashSet`?
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 Set(HashSet<HgPathBuf>),
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Visit this directory and all subdirectories
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 /// (you can stop asking about the children set)
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 Recursive,
}
Raphaël Gomès
rust: add Debug constraint to Matcher trait...
r50381 pub trait Matcher: core::fmt::Debug {
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Explicitly listed files
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 fn file_set(&self) -> Option<&HashSet<HgPathBuf>>;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Returns whether `filename` is in `file_set`
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn exact_match(&self, filename: &HgPath) -> bool;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Returns whether `filename` is matched by this matcher
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn matches(&self, filename: &HgPath) -> bool;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Decides whether a directory should be visited based on whether it
/// has potential matches in it or one of its subdirectories, and
/// potentially lists which subdirectories of that directory should be
/// visited. This is based on the match's primary, included, and excluded
/// patterns.
///
/// # Example
///
/// Assume matchers `['path:foo/bar', 'rootfilesin:qux']`, we would
/// return the following values (assuming the implementation of
/// visit_children_set is capable of recognizing this; some implementations
/// are not).
///
Georges Racinet
rust-matchers: fixing cargo doc...
r44458 /// ```text
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// ```ignore
/// '' -> {'foo', 'qux'}
/// 'baz' -> set()
/// 'foo' -> {'bar'}
/// // Ideally this would be `Recursive`, but since the prefix nature of
/// // matchers is applied to the entire matcher, we have to downgrade this
/// // to `This` due to the (yet to be implemented in Rust) non-prefix
/// // `RootFilesIn`-kind matcher being mixed in.
/// 'foo/bar' -> 'this'
/// 'qux' -> 'this'
/// ```
/// # Important
///
/// Most matchers do not know if they're representing files or
/// directories. They see `['path:dir/f']` and don't know whether `f` is a
/// file or a directory, so `visit_children_set('dir')` for most matchers
/// will return `HashSet{ HgPath { "f" } }`, but if the matcher knows it's
/// a file (like the yet to be implemented in Rust `ExactMatcher` does),
/// it may return `VisitChildrenSet::This`.
/// Do not rely on the return being a `HashSet` indicating that there are
/// no files in this dir to investigate (or equivalently that if there are
/// files to investigate in 'dir' that it will always return
/// `VisitChildrenSet::This`).
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Matcher will match everything and `files_set()` will be empty:
/// optimization might be possible.
Raphaël Gomès
rust-matchers: remove default implementations for `Matcher` trait...
r44009 fn matches_everything(&self) -> bool;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 /// Matcher will match exactly the files in `files_set()`: optimization
/// might be possible.
Raphaël Gomès
rust-matchers: remove default implementations for `Matcher` trait...
r44009 fn is_exact(&self) -> bool;
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 }
/// Matches everything.
Raphaël Gomès
rust-matchers: add doctests for `AlwaysMatcher`...
r44286 ///```
/// use hg::{ matchers::{Matcher, AlwaysMatcher}, utils::hg_path::HgPath };
///
/// let matcher = AlwaysMatcher;
///
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 /// assert_eq!(matcher.matches(HgPath::new(b"whatever")), true);
/// assert_eq!(matcher.matches(HgPath::new(b"b.txt")), true);
/// assert_eq!(matcher.matches(HgPath::new(b"main.c")), true);
/// assert_eq!(matcher.matches(HgPath::new(br"re:.*\.c$")), true);
Raphaël Gomès
rust-matchers: add doctests for `AlwaysMatcher`...
r44286 /// ```
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 #[derive(Debug)]
pub struct AlwaysMatcher;
impl Matcher for AlwaysMatcher {
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
Raphaël Gomès
rust-matchers: improve `Matcher` trait ergonomics...
r44284 None
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 }
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn exact_match(&self, _filename: &HgPath) -> bool {
Raphaël Gomès
rust-matchers: remove default implementations for `Matcher` trait...
r44009 false
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn matches(&self, _filename: &HgPath) -> bool {
Raphaël Gomès
rust-matchers: remove default implementations for `Matcher` trait...
r44009 true
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn visit_children_set(&self, _directory: &HgPath) -> VisitChildrenSet {
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 VisitChildrenSet::Recursive
}
Raphaël Gomès
rust-matchers: remove default implementations for `Matcher` trait...
r44009 fn matches_everything(&self) -> bool {
true
}
fn is_exact(&self) -> bool {
false
}
Raphaël Gomès
rust-matchers: add `Matcher` trait and implement `AlwaysMatcher`...
r43742 }
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366
Raphaël Gomès
rust-dirstate: add support for nevermatcher...
r50247 /// Matches nothing.
#[derive(Debug)]
pub struct NeverMatcher;

impl Matcher for NeverMatcher {
    /// There is no explicit file list: always `None`.
    fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
        None
    }

    /// Every path is rejected, whatever `_filename` is.
    fn matches(&self, _filename: &HgPath) -> bool {
        false
    }

    /// Nothing is explicitly listed, so nothing is an exact match.
    fn exact_match(&self, _filename: &HgPath) -> bool {
        false
    }

    /// No directory has anything worth visiting.
    fn visit_children_set(&self, _directory: &HgPath) -> VisitChildrenSet {
        VisitChildrenSet::Empty
    }

    /// Reported as exact (always `true`).
    fn is_exact(&self) -> bool {
        true
    }

    /// The opposite of matching everything (always `false`).
    fn matches_everything(&self) -> bool {
        false
    }
}
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 /// Matches the input files exactly. They are interpreted as paths, not
/// patterns.
///
///```
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 /// use hg::{ matchers::{Matcher, FileMatcher}, utils::hg_path::{HgPath, HgPathBuf} };
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 ///
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 /// let files = vec![HgPathBuf::from_bytes(b"a.txt"), HgPathBuf::from_bytes(br"re:.*\.c$")];
/// let matcher = FileMatcher::new(files).unwrap();
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 ///
/// assert_eq!(matcher.matches(HgPath::new(b"a.txt")), true);
/// assert_eq!(matcher.matches(HgPath::new(b"b.txt")), false);
/// assert_eq!(matcher.matches(HgPath::new(b"main.c")), false);
/// assert_eq!(matcher.matches(HgPath::new(br"re:.*\.c$")), true);
/// ```
#[derive(Debug)]
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 pub struct FileMatcher {
files: HashSet<HgPathBuf>,
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 dirs: DirsMultiset,
Raphaël Gomès
rust-matchers: fix quadratic complexity in `FileMatcher`...
r52002 sorted_visitchildrenset_candidates: OnceCell<BTreeSet<HgPathBuf>>,
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 }
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 impl FileMatcher {
Spencer Baugh
rust: improve the type on DirsMultiset::from_manifest...
r51753 pub fn new(files: Vec<HgPathBuf>) -> Result<Self, HgPathError> {
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 let dirs = DirsMultiset::from_manifest(&files)?;
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 Ok(Self {
Raphaël Gomès
rust: run a clippy pass with the latest stable version...
r52013 files: HashSet::from_iter(files),
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 dirs,
Raphaël Gomès
rust-matchers: fix quadratic complexity in `FileMatcher`...
r52002 sorted_visitchildrenset_candidates: OnceCell::new(),
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 })
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn inner_matches(&self, filename: &HgPath) -> bool {
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 self.files.contains(filename.as_ref())
}
}
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 impl Matcher for FileMatcher {
fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 Some(&self.files)
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn exact_match(&self, filename: &HgPath) -> bool {
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 self.inner_matches(filename)
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn matches(&self, filename: &HgPath) -> bool {
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 self.inner_matches(filename)
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet {
Raphaël Gomès
rust-matchers: fix quadratic complexity in `FileMatcher`...
r52002 if self.files.is_empty() || !self.dirs.contains(directory) {
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828 return VisitChildrenSet::Empty;
}
Raphaël Gomès
rust-matchers: fix quadratic complexity in `FileMatcher`...
r52002 let compute_candidates = || -> BTreeSet<HgPathBuf> {
let mut candidates: BTreeSet<HgPathBuf> =
self.dirs.iter().cloned().collect();
candidates.extend(self.files.iter().cloned());
candidates.remove(HgPath::new(b""));
candidates
};
let candidates =
if directory.as_ref().is_empty() {
compute_candidates()
} else {
let sorted_candidates = self
.sorted_visitchildrenset_candidates
.get_or_init(compute_candidates);
let directory_bytes = directory.as_ref().as_bytes();
let start: HgPathBuf =
format_bytes!(b"{}/", directory_bytes).into();
let start_len = start.len();
// `0` sorts after `/`
let end = format_bytes!(b"{}0", directory_bytes).into();
BTreeSet::from_iter(sorted_candidates.range(start..end).map(
|c| HgPathBuf::from_bytes(&c.as_bytes()[start_len..]),
))
};
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828
// `self.dirs` includes all of the directories, recursively, so if
// we're attempting to match 'foo/bar/baz.txt', it'll have '', 'foo',
// 'foo/bar' in it. Thus we can safely ignore a candidate that has a
// '/' in it, indicating it's for a subdir-of-a-subdir; the immediate
// subdir will be in there without a slash.
VisitChildrenSet::Set(
candidates
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 .into_iter()
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828 .filter_map(|c| {
if c.bytes().all(|b| *b != b'/') {
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 Some(c)
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828 } else {
None
}
})
.collect(),
)
Raphaël Gomès
rust-matchers: add `FileMatcher` implementation...
r44366 }
fn matches_everything(&self) -> bool {
false
}
fn is_exact(&self) -> bool {
true
}
}
Raphaël Gomès
rust-matchers: add function to generate a regex matcher function...
r45006
Spencer Baugh
rust-matchers: add PatternMatcher...
r51758 /// Matches a set of (kind, pat, source) against a 'root' directory.
/// (Currently the 'root' directory is effectively always empty)
/// ```
/// use hg::{
/// matchers::{PatternMatcher, Matcher},
/// IgnorePattern,
/// PatternSyntax,
/// utils::hg_path::{HgPath, HgPathBuf}
/// };
/// use std::collections::HashSet;
/// use std::path::Path;
/// ///
/// let ignore_patterns : Vec<IgnorePattern> =
/// vec![IgnorePattern::new(PatternSyntax::Regexp, br".*\.c$", Path::new("")),
/// IgnorePattern::new(PatternSyntax::Path, b"foo/a", Path::new("")),
/// IgnorePattern::new(PatternSyntax::RelPath, b"b", Path::new("")),
/// IgnorePattern::new(PatternSyntax::Glob, b"*.h", Path::new("")),
/// ];
/// let matcher = PatternMatcher::new(ignore_patterns).unwrap();
/// ///
/// assert_eq!(matcher.matches(HgPath::new(b"main.c")), true); // matches re:.*\.c$
/// assert_eq!(matcher.matches(HgPath::new(b"b.txt")), false);
/// assert_eq!(matcher.matches(HgPath::new(b"foo/a")), true); // matches path:foo/a
/// assert_eq!(matcher.matches(HgPath::new(b"a")), false); // does not match path:b, since 'root' is 'foo'
/// assert_eq!(matcher.matches(HgPath::new(b"b")), true); // matches relpath:b, since 'root' is 'foo'
/// assert_eq!(matcher.matches(HgPath::new(b"lib.h")), true); // matches glob:*.h
/// assert_eq!(matcher.file_set().unwrap(),
/// &HashSet::from([HgPathBuf::from_bytes(b""), HgPathBuf::from_bytes(b"foo/a"),
/// HgPathBuf::from_bytes(b""), HgPathBuf::from_bytes(b"b")]));
/// assert_eq!(matcher.exact_match(HgPath::new(b"foo/a")), true);
/// assert_eq!(matcher.exact_match(HgPath::new(b"b")), true);
/// assert_eq!(matcher.exact_match(HgPath::new(b"lib.h")), false); // exact matches are for (rel)path kinds
/// ```
pub struct PatternMatcher<'a> {
patterns: Vec<u8>,
match_fn: IgnoreFnType<'a>,
/// Whether all the patterns match a prefix (i.e. recursively)
prefix: bool,
files: HashSet<HgPathBuf>,
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 dirs_explicit: HashSet<HgPathBuf>,
Spencer Baugh
rust-matchers: add PatternMatcher...
r51758 dirs: DirsMultiset,
}
// Hand-written `Debug` implementation: the `match_fn` field is left out of
// the output, and the raw `patterns` bytes are rendered as lossily-decoded
// UTF-8 text so the output stays readable.
impl core::fmt::Debug for PatternMatcher<'_> {
    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
        f.debug_struct("PatternMatcher")
            .field("patterns", &String::from_utf8_lossy(&self.patterns))
            .field("prefix", &self.prefix)
            .field("files", &self.files)
            // `dirs_explicit` takes part in `visit_children_set`, so it is
            // shown alongside the other path sets.
            .field("dirs_explicit", &self.dirs_explicit)
            .field("dirs", &self.dirs)
            .finish()
    }
}
impl<'a> PatternMatcher<'a> {
pub fn new(ignore_patterns: Vec<IgnorePattern>) -> PatternResult<Self> {
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 let RootsDirsAndParents {
roots,
dirs: dirs_explicit,
parents,
} = roots_dirs_and_parents(&ignore_patterns)?;
let files = roots;
let dirs = parents;
Raphaël Gomès
rust: run a clippy pass with the latest stable version...
r52013 let files: HashSet<HgPathBuf> = HashSet::from_iter(files);
Spencer Baugh
rust-matchers: add PatternMatcher...
r51758
let prefix = ignore_patterns.iter().all(|k| {
matches!(k.syntax, PatternSyntax::Path | PatternSyntax::RelPath)
});
let (patterns, match_fn) = build_match(ignore_patterns, b"$")?;
Ok(Self {
patterns,
match_fn,
prefix,
files,
dirs,
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 dirs_explicit,
Spencer Baugh
rust-matchers: add PatternMatcher...
r51758 })
}
}
impl<'a> Matcher for PatternMatcher<'a> {
fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
Some(&self.files)
}
fn exact_match(&self, filename: &HgPath) -> bool {
self.files.contains(filename)
}
/// Returns `true` when `filename` is one of the explicitly listed files;
/// otherwise the answer comes from the compiled pattern function, which
/// is only called when the file-set lookup misses.
fn matches(&self, filename: &HgPath) -> bool {
    self.files.contains(filename) || (self.match_fn)(filename)
}
fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet {
if self.prefix && self.files.contains(directory) {
return VisitChildrenSet::Recursive;
}
Arseniy Alekseyev
match: small tweak to PatternMatcher.visit_children_set...
r52460 if self.dirs.contains(directory) {
return VisitChildrenSet::This;
}
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 if dir_ancestors(directory).any(|parent_dir| {
self.files.contains(parent_dir)
|| self.dirs_explicit.contains(parent_dir)
}) {
Spencer Baugh
rust-matchers: add PatternMatcher...
r51758 VisitChildrenSet::This
} else {
VisitChildrenSet::Empty
}
}
fn matches_everything(&self) -> bool {
false
}
fn is_exact(&self) -> bool {
false
}
}
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 /// Matches files that are included in the ignore rules.
Raphaël Gomès
rust: remove support for `re2`...
r45406 /// ```
/// use hg::{
/// matchers::{IncludeMatcher, Matcher},
/// IgnorePattern,
/// PatternSyntax,
/// utils::hg_path::HgPath
/// };
/// use std::path::Path;
/// ///
/// let ignore_patterns =
/// vec![IgnorePattern::new(PatternSyntax::RootGlob, b"this*", Path::new(""))];
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 /// let matcher = IncludeMatcher::new(ignore_patterns).unwrap();
Raphaël Gomès
rust: remove support for `re2`...
r45406 /// ///
/// assert_eq!(matcher.matches(HgPath::new(b"testing")), false);
/// assert_eq!(matcher.matches(HgPath::new(b"this should work")), true);
/// assert_eq!(matcher.matches(HgPath::new(b"this also")), true);
/// assert_eq!(matcher.matches(HgPath::new(b"but not this")), false);
Martin von Zweigbergk
matchers: use correct method for finding index in vector...
r52167 /// ///
/// let ignore_patterns =
Arseniy Alekseyev
match: rename RootFiles to RootFilesIn for more consistency
r52461 /// vec![IgnorePattern::new(PatternSyntax::RootFilesIn, b"dir/subdir", Path::new(""))];
Martin von Zweigbergk
matchers: use correct method for finding index in vector...
r52167 /// let matcher = IncludeMatcher::new(ignore_patterns).unwrap();
/// ///
/// assert!(!matcher.matches(HgPath::new(b"file")));
/// assert!(!matcher.matches(HgPath::new(b"dir/file")));
/// assert!(matcher.matches(HgPath::new(b"dir/subdir/file")));
/// assert!(!matcher.matches(HgPath::new(b"dir/subdir/subsubdir/file")));
Raphaël Gomès
rust: remove support for `re2`...
r45406 /// ```
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 pub struct IncludeMatcher<'a> {
patterns: Vec<u8>,
Arseniy Alekseyev
rhg: refactor to use IgnoreFnType alias more widely...
r49177 match_fn: IgnoreFnType<'a>,
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 /// Whether all the patterns match a prefix (i.e. recursively)
prefix: bool,
roots: HashSet<HgPathBuf>,
dirs: HashSet<HgPathBuf>,
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 parents: DirsMultiset,
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
Raphaël Gomès
rust: add Debug constraint to Matcher trait...
r50381 impl core::fmt::Debug for IncludeMatcher<'_> {
/// Writes the matcher as an `IncludeMatcher { .. }` debug struct with the
/// `patterns`, `prefix`, `roots`, `dirs` and `parents` fields. The raw
/// `patterns` bytes are shown as lossily-decoded UTF-8 text.
fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
    let readable_patterns = String::from_utf8_lossy(&self.patterns);
    let mut out = f.debug_struct("IncludeMatcher");
    out.field("patterns", &readable_patterns);
    out.field("prefix", &self.prefix);
    out.field("roots", &self.roots);
    out.field("dirs", &self.dirs);
    out.field("parents", &self.parents);
    out.finish()
}
}
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 impl<'a> Matcher for IncludeMatcher<'a> {
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 None
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn exact_match(&self, _filename: &HgPath) -> bool {
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 false
}
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn matches(&self, filename: &HgPath) -> bool {
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 (self.match_fn)(filename)
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
Raphaël Gomès
rust-matchers: make `Matcher` trait object-safe...
r46182 fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet {
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 let dir = directory;
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 if self.prefix && self.roots.contains(dir) {
return VisitChildrenSet::Recursive;
}
if self.roots.contains(HgPath::new(b""))
|| self.roots.contains(dir)
|| self.dirs.contains(dir)
|| find_dirs(dir).any(|parent_dir| self.roots.contains(parent_dir))
{
return VisitChildrenSet::This;
}
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 if self.parents.contains(dir.as_ref()) {
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 let multiset = self.get_all_parents_children();
if let Some(children) = multiset.get(dir) {
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 return VisitChildrenSet::Set(
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 children.iter().map(HgPathBuf::from).collect(),
Raphaël Gomès
rust: use owned types in `Matcher`...
r50241 );
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
}
VisitChildrenSet::Empty
}
fn matches_everything(&self) -> bool {
false
}
fn is_exact(&self) -> bool {
false
}
}
Raphaël Gomès
rust: add UnionMatcher...
r50243 /// The union of multiple matchers. Will match if any of the matchers match.
Raphaël Gomès
rust: add Debug constraint to Matcher trait...
r50381 #[derive(Debug)]
Raphaël Gomès
rust: add UnionMatcher...
r50243 pub struct UnionMatcher {
matchers: Vec<Box<dyn Matcher + Sync>>,
}
impl Matcher for UnionMatcher {
    /// A union does not expose an explicit file list.
    fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
        None
    }

    /// Never reports an exact match.
    fn exact_match(&self, _filename: &HgPath) -> bool {
        false
    }

    /// `filename` matches as soon as one of the inner matchers accepts it.
    fn matches(&self, filename: &HgPath) -> bool {
        self.matchers.iter().any(|m| m.matches(filename))
    }

    /// Merges the answers of all inner matchers for `directory`:
    ///
    /// - any `Recursive` answer wins immediately;
    /// - otherwise any `This` answer yields `This`;
    /// - otherwise the child sets are unioned, and an empty union yields
    ///   `Empty`.
    fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet {
        let mut merged_children = HashSet::new();
        let mut saw_this = false;
        for inner in &self.matchers {
            match inner.visit_children_set(directory) {
                // Nothing can be broader than this, stop looking.
                VisitChildrenSet::Recursive => {
                    return VisitChildrenSet::Recursive;
                }
                // Keep going: a later matcher may still answer `Recursive`.
                VisitChildrenSet::This => saw_this = true,
                VisitChildrenSet::Set(children) => {
                    merged_children.extend(children)
                }
                VisitChildrenSet::Empty => {}
            }
        }
        if saw_this {
            VisitChildrenSet::This
        } else if merged_children.is_empty() {
            VisitChildrenSet::Empty
        } else {
            VisitChildrenSet::Set(merged_children)
        }
    }

    fn matches_everything(&self) -> bool {
        // TODO Maybe if all are AlwaysMatcher?
        false
    }

    /// A union is never reported as exact.
    fn is_exact(&self) -> bool {
        false
    }
}
impl UnionMatcher {
pub fn new(matchers: Vec<Box<dyn Matcher + Sync>>) -> Self {
Self { matchers }
}
}
Raphaël Gomès
rust: add Debug constraint to Matcher trait...
r50381 #[derive(Debug)]
Raphaël Gomès
rust: add IntersectionMatcher...
r50245 pub struct IntersectionMatcher {
m1: Box<dyn Matcher + Sync>,
m2: Box<dyn Matcher + Sync>,
files: Option<HashSet<HgPathBuf>>,
}
impl Matcher for IntersectionMatcher {
fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
self.files.as_ref()
}
/// Returns whether `filename` belongs to the stored file set; `false`
/// when there is no file set at all.
fn exact_match(&self, filename: &HgPath) -> bool {
    match &self.files {
        Some(known_files) => known_files.contains(filename),
        None => false,
    }
}
fn matches(&self, filename: &HgPath) -> bool {
self.m1.matches(filename) && self.m2.matches(filename)
}
fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet {
let m1_set = self.m1.visit_children_set(directory);
if m1_set == VisitChildrenSet::Empty {
return VisitChildrenSet::Empty;
}
let m2_set = self.m2.visit_children_set(directory);
if m2_set == VisitChildrenSet::Empty {
return VisitChildrenSet::Empty;
}
if m1_set == VisitChildrenSet::Recursive {
return m2_set;
} else if m2_set == VisitChildrenSet::Recursive {
return m1_set;
}
match (&m1_set, &m2_set) {
(VisitChildrenSet::Recursive, _) => m2_set,
(_, VisitChildrenSet::Recursive) => m1_set,
(VisitChildrenSet::This, _) | (_, VisitChildrenSet::This) => {
VisitChildrenSet::This
}
(VisitChildrenSet::Set(m1), VisitChildrenSet::Set(m2)) => {
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 let set: HashSet<_> = m1.intersection(m2).cloned().collect();
Raphaël Gomès
rust: add IntersectionMatcher...
r50245 if set.is_empty() {
VisitChildrenSet::Empty
} else {
VisitChildrenSet::Set(set)
}
}
_ => unreachable!(),
}
}
fn matches_everything(&self) -> bool {
self.m1.matches_everything() && self.m2.matches_everything()
}
fn is_exact(&self) -> bool {
self.m1.is_exact() || self.m2.is_exact()
}
}
impl IntersectionMatcher {
pub fn new(
mut m1: Box<dyn Matcher + Sync>,
mut m2: Box<dyn Matcher + Sync>,
) -> Self {
let files = if m1.is_exact() || m2.is_exact() {
if !m1.is_exact() {
std::mem::swap(&mut m1, &mut m2);
}
m1.file_set().map(|m1_files| {
Raphaël Gomès
rust: apply clippy lints...
r52600 m1_files
.iter()
.filter(|&f| m2.matches(f))
.cloned()
.collect()
Raphaël Gomès
rust: add IntersectionMatcher...
r50245 })
} else {
Spencer Baugh
rust-matchers: better support file_set in IntersectionMatcher...
r51749 // without exact input file sets, we can't do an exact
// intersection, so we must over-approximate by
// unioning instead
m1.file_set().map(|m1_files| match m2.file_set() {
Some(m2_files) => m1_files.union(m2_files).cloned().collect(),
None => m1_files.iter().cloned().collect(),
})
Raphaël Gomès
rust: add IntersectionMatcher...
r50245 };
Self { m1, m2, files }
}
}
Raphaël Gomès
rust: add Debug constraint to Matcher trait...
r50381 #[derive(Debug)]
Raphaël Gomès
rust-matchers: implement DifferenceMatcher...
r50373 pub struct DifferenceMatcher {
base: Box<dyn Matcher + Sync>,
excluded: Box<dyn Matcher + Sync>,
files: Option<HashSet<HgPathBuf>>,
}
impl Matcher for DifferenceMatcher {
    /// The file set stored in `files`, if any.
    fn file_set(&self) -> Option<&HashSet<HgPathBuf>> {
        self.files.as_ref()
    }

    /// Returns whether `filename` belongs to the stored file set; `false`
    /// when there is no file set at all.
    fn exact_match(&self, filename: &HgPath) -> bool {
        match &self.files {
            Some(known_files) => known_files.contains(filename),
            None => false,
        }
    }

    /// A file matches when `base` accepts it and `excluded` does not.
    /// `excluded` is only consulted for files that `base` accepts.
    fn matches(&self, filename: &HgPath) -> bool {
        if !self.base.matches(filename) {
            return false;
        }
        !self.excluded.matches(filename)
    }

    /// Combines the answers of `base` and `excluded` for `directory`.
    ///
    /// `excluded` is queried first; `base` is only queried when `excluded`
    /// does not cover the whole subtree.
    fn visit_children_set(&self, directory: &HgPath) -> VisitChildrenSet {
        match self.excluded.visit_children_set(directory) {
            // Everything below `directory` is excluded.
            VisitChildrenSet::Recursive => VisitChildrenSet::Empty,
            // If excluded has nothing under here that we care about, return
            // what base says, even if it's 'recursive'.
            VisitChildrenSet::Empty => self.base.visit_children_set(directory),
            // Excluded is either 'this' or a set.
            VisitChildrenSet::This | VisitChildrenSet::Set(_) => {
                match self.base.visit_children_set(directory) {
                    // Never return 'recursive' here if the excluded answer
                    // is any kind of non-empty (either 'this' or set(foo)),
                    // since excluded might return set() for a subdirectory.
                    VisitChildrenSet::This | VisitChildrenSet::Recursive => {
                        VisitChildrenSet::This
                    }
                    // Base answered set(...) or set(). The excluded set is
                    // deliberately ignored, subtracting it could be wrong:
                    //   base = path:dir/subdir
                    //   excluded = rootfilesin:dir
                    //   visit_children_set(''):
                    //     base returns {'dir'}, excluded returns {'dir'};
                    //     subtracting would give set(), which is *not*
                    //     correct, we still need to visit 'dir'!
                    base_answer => base_answer,
                }
            }
        }
    }

    /// A difference is never reported as matching everything.
    fn matches_everything(&self) -> bool {
        false
    }

    /// Exactness is inherited from `base`.
    fn is_exact(&self) -> bool {
        self.base.is_exact()
    }
}
impl DifferenceMatcher {
pub fn new(
base: Box<dyn Matcher + Sync>,
excluded: Box<dyn Matcher + Sync>,
) -> Self {
let base_is_exact = base.is_exact();
let base_files = base.file_set().map(ToOwned::to_owned);
let mut new = Self {
base,
excluded,
files: None,
};
if base_is_exact {
new.files = base_files.map(|files| {
Raphaël Gomès
rust: apply clippy lints...
r52600 files.iter().filter(|&f| new.matches(f)).cloned().collect()
Raphaël Gomès
rust-matchers: implement DifferenceMatcher...
r50373 });
}
new
}
}
Raphaël Gomès
rust: create wrapper struct to reduce `regex` contention issues...
r50476 /// Wraps [`regex::bytes::Regex`] to improve performance in multithreaded
/// contexts.
///
/// The `status` algorithm makes heavy use of threads, and calling `is_match`
/// from many threads at once is prone to contention, probably within the
/// scratch space needed as the regex DFA is built lazily.
///
/// We are in the process of raising the issue upstream, but for now
/// the workaround used here is to store the `Regex` in a lazily populated
/// thread-local variable, sharing the initial read-only compilation, but
/// not the lazy dfa scratch space mentioned above.
///
/// This reduces the contention observed with 16+ threads, but does not
/// completely remove it. Hopefully this can be addressed upstream.
struct RegexMatcher {
/// Compiled at the start of the status algorithm, used as a base for
/// cloning in each thread-local `self.local`, thus sharing the expensive
/// first compilation.
base: regex::bytes::Regex,
/// Thread-local variable that holds the `Regex` that is actually queried
/// from each thread.
local: thread_local::ThreadLocal<regex::bytes::Regex>,
}
impl RegexMatcher {
    /// Tells whether `path` matches the stored `Regex`.
    ///
    /// The regex queried is the calling thread's own copy, cloned from
    /// `self.base` the first time this thread asks for it.
    pub fn is_match(&self, path: &HgPath) -> bool {
        let thread_regex = self.local.get_or(|| self.base.clone());
        thread_regex.is_match(path.as_bytes())
    }
}
Georges Racinet
rust-matchers: raw regular expression builder...
r52364 /// Return a `RegexBuilder` from a bytes pattern
Raphaël Gomès
rust-matchers: use the `regex` crate...
r45084 ///
Georges Racinet
rust-matchers: raw regular expression builder...
r52364 /// This works around the fact that even if it works on byte haysacks,
/// [`regex::bytes::Regex`] still uses UTF-8 patterns.
pub fn re_bytes_builder(pattern: &[u8]) -> regex::bytes::RegexBuilder {
Raphaël Gomès
rust-matchers: use the `regex` crate...
r45084 use std::io::Write;
Raphaël Gomès
rust-regex: fix issues with regex anchoring and performance...
r45347 // The `regex` crate adds `.*` to the start and end of expressions if there
// are no anchors, so add the start anchor.
let mut escaped_bytes = vec![b'^', b'(', b'?', b':'];
Raphaël Gomès
rust-matchers: use the `regex` crate...
r45084 for byte in pattern {
if *byte > 127 {
write!(escaped_bytes, "\\x{:x}", *byte).unwrap();
} else {
escaped_bytes.push(*byte);
}
}
Raphaël Gomès
rust-regex: fix issues with regex anchoring and performance...
r45347 escaped_bytes.push(b')');
Raphaël Gomès
rust-matchers: use the `regex` crate...
r45084
// Avoid the cost of UTF8 checking
//
// # Safety
// This is safe because we escaped all non-ASCII bytes.
let pattern_string = unsafe { String::from_utf8_unchecked(escaped_bytes) };
Georges Racinet
rust-matchers: raw regular expression builder...
r52364 regex::bytes::RegexBuilder::new(&pattern_string)
}
/// Returns a function that matches an `HgPath` against the given regex
/// pattern.
///
/// This can fail when the pattern is invalid or not supported by the
/// underlying engine (the `regex` crate), for instance anything with
/// back-references.
#[logging_timer::time("trace")]
fn re_matcher(pattern: &[u8]) -> PatternResult<RegexMatcher> {
let re = re_bytes_builder(pattern)
Raphaël Gomès
rust-matchers: use the `regex` crate...
r45084 .unicode(false)
Raphaël Gomès
rust-regex: increase the DFA size limit for the `regex` crate...
r45286 // Big repos with big `.hgignore` will hit the default limit and
// incur a significant performance hit. One repo's `hg status` hit
// multiple *minutes*.
.dfa_size_limit(50 * (1 << 20))
Raphaël Gomès
rust-matchers: use the `regex` crate...
r45084 .build()
.map_err(|e| PatternError::UnsupportedSyntax(e.to_string()))?;
Raphaël Gomès
rust: create wrapper struct to reduce `regex` contention issues...
r50476 Ok(RegexMatcher {
base: re,
local: Default::default(),
})
Raphaël Gomès
rust-matchers: add function to generate a regex matcher function...
r45006 }
Raphaël Gomès
rust-matchers: add `build_regex_match` function...
r45008 /// Returns the regex pattern and a function that matches an `HgPath` against
/// said regex formed by the given ignore patterns.
Raphaël Gomès
rust: run a clippy pass with the latest stable version...
r52013 fn build_regex_match<'a>(
ignore_patterns: &[IgnorePattern],
Spencer Baugh
rust: de-hardcode glob_suffix...
r51754 glob_suffix: &[u8],
Raphaël Gomès
rust: run a clippy pass with the latest stable version...
r52013 ) -> PatternResult<(Vec<u8>, IgnoreFnType<'a>)> {
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 let mut regexps = vec![];
let mut exact_set = HashSet::new();
for pattern in ignore_patterns {
Spencer Baugh
rust: de-hardcode glob_suffix...
r51754 if let Some(re) = build_single_regex(pattern, glob_suffix)? {
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 regexps.push(re);
} else {
let exact = normalize_path_bytes(&pattern.pattern);
exact_set.insert(HgPathBuf::from_bytes(&exact));
}
}
Raphaël Gomès
rust-matchers: add `build_regex_match` function...
r45008 let full_regex = regexps.join(&b'|');
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 // An empty pattern would cause the regex engine to incorrectly match the
// (empty) root directory
let func = if !(regexps.is_empty()) {
let matcher = re_matcher(&full_regex)?;
let func = move |filename: &HgPath| {
Raphaël Gomès
rust: create wrapper struct to reduce `regex` contention issues...
r50476 exact_set.contains(filename) || matcher.is_match(filename)
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 };
Arseniy Alekseyev
rhg: refactor to use IgnoreFnType alias more widely...
r49177 Box::new(func) as IgnoreFnType
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 } else {
let func = move |filename: &HgPath| exact_set.contains(filename);
Arseniy Alekseyev
rhg: refactor to use IgnoreFnType alias more widely...
r49177 Box::new(func) as IgnoreFnType
Raphaël Gomès
rust-filepatterns: match exact `rootglob`s with a `HashSet`, not in the regex...
r45311 };
Raphaël Gomès
rust-matchers: add `build_regex_match` function...
r45008
Ok((full_regex, func))
}
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 /// Returns roots and directories corresponding to each pattern.
///
/// This calculates the roots and directories exactly matching the patterns and
/// returns a tuple of (roots, dirs). It does not return other directories
/// which may also need to be considered, like the parent directories.
fn roots_and_dirs(
ignore_patterns: &[IgnorePattern],
) -> (Vec<HgPathBuf>, Vec<HgPathBuf>) {
let mut roots = Vec::new();
let mut dirs = Vec::new();
for ignore_pattern in ignore_patterns {
let IgnorePattern {
syntax, pattern, ..
} = ignore_pattern;
match syntax {
PatternSyntax::RootGlob | PatternSyntax::Glob => {
Arseniy Alekseyev
rhg: more efficient `HgPath::join`...
r49132 let mut root = HgPathBuf::new();
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 for p in pattern.split(|c| *c == b'/') {
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 if p.iter()
.any(|c| matches!(*c, b'[' | b'{' | b'*' | b'?'))
{
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 break;
}
Arseniy Alekseyev
rhg: more efficient `HgPath::join`...
r49132 root.push(HgPathBuf::from_bytes(p).as_ref());
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 }
Arseniy Alekseyev
rhg: more efficient `HgPath::join`...
r49132 roots.push(root);
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 }
Raphaël Gomès
match: add `filepath:` pattern to match an exact filepath relative to the root...
r51588 PatternSyntax::Path
| PatternSyntax::RelPath
| PatternSyntax::FilePath => {
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 let pat = HgPath::new(if pattern == b"." {
&[] as &[u8]
} else {
pattern
});
roots.push(pat.to_owned());
}
Arseniy Alekseyev
match: rename RootFiles to RootFilesIn for more consistency
r52461 PatternSyntax::RootFilesIn => {
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 let pat = if pattern == b"." {
&[] as &[u8]
} else {
pattern
};
dirs.push(HgPathBuf::from_bytes(pat));
}
_ => {
roots.push(HgPathBuf::new());
}
}
}
(roots, dirs)
}
/// Paths extracted from patterns
#[derive(Debug, PartialEq)]
struct RootsDirsAndParents {
/// Directories to match recursively
pub roots: HashSet<HgPathBuf>,
/// Directories to match non-recursively
pub dirs: HashSet<HgPathBuf>,
/// Implicitly required directories to go to items in either roots or dirs
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 pub parents: DirsMultiset,
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 }
/// Extract roots, dirs and parents from patterns.
fn roots_dirs_and_parents(
ignore_patterns: &[IgnorePattern],
) -> PatternResult<RootsDirsAndParents> {
let (roots, dirs) = roots_and_dirs(ignore_patterns);
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 let mut parents = DirsMultiset::from_manifest(&dirs)?;
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 for path in &roots {
parents.add_path(path)?
}
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007
Ok(RootsDirsAndParents {
roots: HashSet::from_iter(roots),
dirs: HashSet::from_iter(dirs),
parents,
})
}
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 /// Returns a function that checks whether a given file (in the general sense)
/// should be matched.
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 fn build_match<'a>(
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 ignore_patterns: Vec<IgnorePattern>,
Spencer Baugh
rust: de-hardcode glob_suffix...
r51754 glob_suffix: &[u8],
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 ) -> PatternResult<(Vec<u8>, IgnoreFnType<'a>)> {
let mut match_funcs: Vec<IgnoreFnType<'a>> = vec![];
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 // For debugging and printing
let mut patterns = vec![];
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 let (subincludes, ignore_patterns) = filter_subincludes(ignore_patterns)?;
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009
if !subincludes.is_empty() {
// Build prefix-based matcher functions for subincludes
let mut submatchers = FastHashMap::default();
let mut prefixes = vec![];
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 for sub_include in subincludes {
let matcher = IncludeMatcher::new(sub_include.included_patterns)?;
let match_fn =
Box::new(move |path: &HgPath| matcher.matches(path));
prefixes.push(sub_include.prefix.clone());
submatchers.insert(sub_include.prefix.clone(), match_fn);
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
let match_subinclude = move |filename: &HgPath| {
for prefix in prefixes.iter() {
if let Some(rel) = filename.relative_to(prefix) {
Raphaël Gomès
rust: do a clippy pass...
r45500 if (submatchers[prefix])(rel) {
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 return true;
}
}
}
false
};
match_funcs.push(Box::new(match_subinclude));
}
if !ignore_patterns.is_empty() {
// Either do dumb matching if all patterns are rootfiles, or match
// with a regex.
if ignore_patterns
.iter()
Arseniy Alekseyev
match: rename RootFiles to RootFilesIn for more consistency
r52461 .all(|k| k.syntax == PatternSyntax::RootFilesIn)
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 {
let dirs: HashSet<_> = ignore_patterns
.iter()
.map(|k| k.pattern.to_owned())
.collect();
let mut dirs_vec: Vec<_> = dirs.iter().cloned().collect();
let match_func = move |path: &HgPath| -> bool {
let path = path.as_bytes();
Martin von Zweigbergk
matchers: use correct method for finding index in vector...
r52167 let i = path.iter().rposition(|a| *a == b'/');
let dir = if let Some(i) = i { &path[..i] } else { b"." };
Raphaël Gomès
rust: run a clippy pass with the latest stable version...
r52013 dirs.contains(dir)
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 };
match_funcs.push(Box::new(match_func));
patterns.extend(b"rootfilesin: ");
dirs_vec.sort();
patterns.extend(dirs_vec.escaped_bytes());
} else {
Spencer Baugh
rust: de-hardcode glob_suffix...
r51754 let (new_re, match_func) =
build_regex_match(&ignore_patterns, glob_suffix)?;
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 patterns = new_re;
match_funcs.push(match_func)
}
}
Ok(if match_funcs.len() == 1 {
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 (patterns, match_funcs.remove(0))
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 } else {
(
patterns,
Box::new(move |f: &HgPath| -> bool {
match_funcs.iter().any(|match_func| match_func(f))
}),
)
})
}
/// Parses all "ignore" files with their recursive includes and returns a
/// function that checks whether a given file (in the general sense) should be
/// ignored.
Arseniy Alekseyev
rhg: implement the debugignorerhg subcommand...
r49178 pub fn get_ignore_matcher<'a>(
Simon Sapin
dirstate-v2: Store a hash of ignore patterns (.hgignore)...
r48202 mut all_pattern_files: Vec<PathBuf>,
Simon Sapin
rust: Make some file path parameters less generic...
r48169 root_dir: &Path,
Raphaël Gomès
dirstate-v2: hash the source of the ignore patterns as well...
r50453 inspect_pattern_bytes: &mut impl FnMut(&Path, &[u8]),
Arseniy Alekseyev
rhg: implement the debugignorerhg subcommand...
r49178 ) -> PatternResult<(IncludeMatcher<'a>, Vec<PatternFileWarning>)> {
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 let mut all_patterns = vec![];
let mut all_warnings = vec![];
Simon Sapin
dirstate-v2: Store a hash of ignore patterns (.hgignore)...
r48202 // Sort to make the ordering of calls to `inspect_pattern_bytes`
// deterministic even if the ordering of `all_pattern_files` is not (such
// as when a iteration order of a Python dict or Rust HashMap is involved).
// Sort by "string" representation instead of the default by component
// (with a Rust-specific definition of a component)
all_pattern_files
.sort_unstable_by(|a, b| a.as_os_str().cmp(b.as_os_str()));
Simon Sapin
rust: Make some file path parameters less generic...
r48169 for pattern_file in &all_pattern_files {
Simon Sapin
dirstate-v2: Store a hash of ignore patterns (.hgignore)...
r48202 let (patterns, warnings) = get_patterns_from_file(
pattern_file,
root_dir,
inspect_pattern_bytes,
)?;
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009
Raphaël Gomès
rust-status: only involve ignore mechanism when needed...
r45088 all_patterns.extend(patterns.to_owned());
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 all_warnings.extend(warnings);
}
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 let matcher = IncludeMatcher::new(all_patterns)?;
Arseniy Alekseyev
rhg: implement the debugignorerhg subcommand...
r49178 Ok((matcher, all_warnings))
}
/// Parses all "ignore" files with their recursive includes and returns a
/// function that checks whether a given file (in the general sense) should be
/// ignored.
pub fn get_ignore_function<'a>(
all_pattern_files: Vec<PathBuf>,
root_dir: &Path,
Raphaël Gomès
dirstate-v2: hash the source of the ignore patterns as well...
r50453 inspect_pattern_bytes: &mut impl FnMut(&Path, &[u8]),
Arseniy Alekseyev
rhg: implement the debugignorerhg subcommand...
r49178 ) -> PatternResult<(IgnoreFnType<'a>, Vec<PatternFileWarning>)> {
let res =
get_ignore_matcher(all_pattern_files, root_dir, inspect_pattern_bytes);
res.map(|(matcher, all_warnings)| {
let res: IgnoreFnType<'a> =
Box::new(move |path: &HgPath| matcher.matches(path));
(res, all_warnings)
})
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
impl<'a> IncludeMatcher<'a> {
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 pub fn new(ignore_patterns: Vec<IgnorePattern>) -> PatternResult<Self> {
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 let RootsDirsAndParents {
roots,
dirs,
parents,
} = roots_dirs_and_parents(&ignore_patterns)?;
Raphaël Gomès
rust-clippy: fix most warnings in `hg-core`...
r50825 let prefix = ignore_patterns.iter().all(|k| {
matches!(k.syntax, PatternSyntax::Path | PatternSyntax::RelPath)
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 });
Spencer Baugh
rust: de-hardcode glob_suffix...
r51754 let (patterns, match_fn) = build_match(ignore_patterns, b"(?:/|$)")?;
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009
Simon Sapin
rust: Parse "subinclude"d files along the way, not later...
r48170 Ok(Self {
patterns,
match_fn,
prefix,
roots,
dirs,
parents,
})
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
fn get_all_parents_children(&self) -> DirsChildrenMultiset {
// TODO cache
let thing = self
.dirs
.iter()
.chain(self.roots.iter())
.chain(self.parents.iter());
Arseniy Alekseyev
match: fix the rust-side bug in visit_children_set for rootfilesin matchers...
r52463 DirsChildrenMultiset::new(thing, Some(self.parents.iter()))
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
Arseniy Alekseyev
rhg: implement the debugignorerhg subcommand...
r49178
pub fn debug_get_patterns(&self) -> &[u8] {
self.patterns.as_ref()
}
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 }
impl<'a> Display for IncludeMatcher<'a> {
fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error> {
Raphaël Gomès
rust-matchers: add TODO about incomplete `Display` for `IncludeMatcher`...
r45312 // XXX What about exact matches?
// I'm not sure it's worth it to clone the HashSet and keep it
// around just in case someone wants to display the matcher, plus
// it's going to be unreadable after a few entries, but we need to
// inform in this display that exact matches are being used and are
// (on purpose) missing from the `includes`.
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009 write!(
f,
"IncludeMatcher(includes='{}')",
String::from_utf8_lossy(&self.patterns.escaped_bytes())
)
}
}
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828 #[cfg(test)]
mod tests {
use super::*;
use pretty_assertions::assert_eq;
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 use std::collections::BTreeMap;
use std::collections::BTreeSet;
use std::fmt::Debug;
Raphaël Gomès
rust-matchers: add functions to get roots, dirs and parents from patterns...
r45007 use std::path::Path;
#[test]
fn test_roots_and_dirs() {
    // Every pattern of this test is a glob with an empty source path.
    let glob = |pattern: &str| {
        IgnorePattern::new(
            PatternSyntax::Glob,
            pattern.as_bytes(),
            Path::new(""),
        )
    };
    let pats = vec![glob("g/h/*"), glob("g/h"), glob("g*")];

    let (roots, dirs) = roots_and_dirs(&pats);

    let expected_roots = vec![
        HgPathBuf::from_bytes(b"g/h"),
        HgPathBuf::from_bytes(b"g/h"),
        HgPathBuf::new(),
    ];
    assert_eq!(roots, expected_roots);
    assert_eq!(dirs, vec![]);
}
#[test]
fn test_roots_dirs_and_parents() {
    // Every pattern of this test is a glob with an empty source path.
    let glob = |pattern: &str| {
        IgnorePattern::new(
            PatternSyntax::Glob,
            pattern.as_bytes(),
            Path::new(""),
        )
    };
    let pats = vec![glob("g/h/*"), glob("g/h"), glob("g*")];

    let roots: HashSet<_> =
        vec![HgPathBuf::from_bytes(b"g/h"), HgPathBuf::new()]
            .into_iter()
            .collect();
    let dirs = HashSet::new();
    let parents = DirsMultiset::from_manifest(&[
        HgPathBuf::from_bytes(b"x"),
        HgPathBuf::from_bytes(b"g/x"),
        HgPathBuf::from_bytes(b"g/y"),
    ])
    .unwrap();

    let expected = RootsDirsAndParents {
        roots,
        dirs,
        parents,
    };
    assert_eq!(roots_dirs_and_parents(&pats).unwrap(), expected);
}
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828
#[test]
fn test_filematcher_visit_children_set() {
    // Visitchildrenset
    let files = vec![HgPathBuf::from_bytes(b"dir/subdir/foo.txt")];
    let matcher = FileMatcher::new(files).unwrap();

    // Asks the matcher which children of `dir` must be visited.
    let visit = |dir: &str| {
        matcher.visit_children_set(HgPath::new(dir.as_bytes()))
    };
    // Builds the expected `Set` variant out of child names.
    let children = |names: &[&str]| {
        VisitChildrenSet::Set(
            names
                .iter()
                .map(|name| HgPathBuf::from_bytes(name.as_bytes()))
                .collect(),
        )
    };

    assert_eq!(visit(""), children(&["dir"]));
    assert_eq!(visit("dir"), children(&["subdir"]));
    assert_eq!(visit("dir/subdir"), children(&["foo.txt"]));
    assert_eq!(visit("dir/subdir/x"), VisitChildrenSet::Empty);
    assert_eq!(visit("dir/subdir/foo.txt"), VisitChildrenSet::Empty);
    assert_eq!(visit("folder"), VisitChildrenSet::Empty);
}
#[test]
fn test_filematcher_visit_children_set_files_and_dirs() {
    let files = vec![
        HgPathBuf::from_bytes(b"rootfile.txt"),
        HgPathBuf::from_bytes(b"a/file1.txt"),
        HgPathBuf::from_bytes(b"a/b/file2.txt"),
        // No file in a/b/c
        HgPathBuf::from_bytes(b"a/b/c/d/file4.txt"),
    ];
    let matcher = FileMatcher::new(files).unwrap();

    // Asks the matcher which children of `dir` must be visited.
    let visit = |dir: &str| {
        matcher.visit_children_set(HgPath::new(dir.as_bytes()))
    };
    // Builds the expected `Set` variant out of child names.
    let children = |names: &[&str]| {
        VisitChildrenSet::Set(
            names
                .iter()
                .map(|name| HgPathBuf::from_bytes(name.as_bytes()))
                .collect(),
        )
    };

    assert_eq!(visit(""), children(&["a", "rootfile.txt"]));
    assert_eq!(visit("a"), children(&["b", "file1.txt"]));
    assert_eq!(visit("a/b"), children(&["c", "file2.txt"]));
    assert_eq!(visit("a/b/c"), children(&["d"]));
    assert_eq!(visit("a/b/c/d"), children(&["file4.txt"]));
    assert_eq!(visit("a/b/c/d/e"), VisitChildrenSet::Empty);
    assert_eq!(visit("folder"), VisitChildrenSet::Empty);
}
Raphaël Gomès
rust-matchers: add `IgnoreMatcher`...
r45009
#[test]
fn test_patternmatcher() {
    /// Builds a `PatternMatcher` from a single pattern, then checks the
    /// result of `visit_children_set` for each `(directory, expected)` pair,
    /// in order.
    fn check(
        syntax: PatternSyntax,
        pattern: &str,
        cases: &[(&str, VisitChildrenSet)],
    ) {
        let m = PatternMatcher::new(vec![IgnorePattern::new(
            syntax,
            pattern.as_bytes(),
            Path::new(""),
        )])
        .unwrap();
        for (dir, expected) in cases {
            assert_eq!(
                m.visit_children_set(HgPath::new(dir.as_bytes())),
                *expected
            );
        }
    }

    // VisitdirPrefix
    check(
        PatternSyntax::Path,
        "dir/subdir",
        &[
            ("", VisitChildrenSet::This),
            ("dir", VisitChildrenSet::This),
            ("dir/subdir", VisitChildrenSet::Recursive),
            // OPT: This should probably be Recursive if its parent is?
            ("dir/subdir/x", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
        ],
    );

    // VisitchildrensetPrefix
    check(
        PatternSyntax::Path,
        "dir/subdir",
        &[
            ("", VisitChildrenSet::This),
            ("dir", VisitChildrenSet::This),
            ("dir/subdir", VisitChildrenSet::Recursive),
            // OPT: This should probably be Recursive if its parent is?
            ("dir/subdir/x", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
        ],
    );

    // VisitdirRootfilesin
    check(
        PatternSyntax::RootFilesIn,
        "dir/subdir",
        &[
            ("dir/subdir/x", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
            ("", VisitChildrenSet::This),
            ("dir", VisitChildrenSet::This),
            ("dir/subdir", VisitChildrenSet::This),
        ],
    );

    // VisitchildrensetRootfilesin
    check(
        PatternSyntax::RootFilesIn,
        "dir/subdir",
        &[
            ("dir/subdir/x", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
            // FIXME: These should probably be {'dir'}, {'subdir'} and This,
            // respectively
            ("", VisitChildrenSet::This),
            ("dir", VisitChildrenSet::This),
            ("dir/subdir", VisitChildrenSet::This),
        ],
    );

    // VisitdirGlob
    check(
        PatternSyntax::Glob,
        "dir/z*",
        &[
            ("", VisitChildrenSet::This),
            ("dir", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
            // OPT: these should probably be False.
            ("dir/subdir", VisitChildrenSet::This),
            ("dir/subdir/x", VisitChildrenSet::This),
        ],
    );

    // VisitchildrensetGlob
    check(
        PatternSyntax::Glob,
        "dir/z*",
        &[
            ("", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
            ("dir", VisitChildrenSet::This),
            // OPT: these should probably be Empty
            ("dir/subdir", VisitChildrenSet::This),
            ("dir/subdir/x", VisitChildrenSet::This),
        ],
    );

    // VisitdirFilepath
    check(
        PatternSyntax::FilePath,
        "dir/z",
        &[
            ("", VisitChildrenSet::This),
            ("dir", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
            ("dir/subdir", VisitChildrenSet::Empty),
            ("dir/subdir/x", VisitChildrenSet::Empty),
        ],
    );

    // VisitchildrensetFilepath
    check(
        PatternSyntax::FilePath,
        "dir/z",
        &[
            ("", VisitChildrenSet::This),
            ("folder", VisitChildrenSet::Empty),
            ("dir", VisitChildrenSet::This),
            ("dir/subdir", VisitChildrenSet::Empty),
            ("dir/subdir/x", VisitChildrenSet::Empty),
        ],
    );
}
#[test]
fn test_includematcher() {
    /// Asks `m` which children of directory `dir` need to be visited.
    fn visit<M: Matcher>(m: &M, dir: &[u8]) -> VisitChildrenSet {
        m.visit_children_set(HgPath::new(dir))
    }
    /// Expected answer consisting of exactly the given child names.
    fn set_of(children: &[&[u8]]) -> VisitChildrenSet {
        VisitChildrenSet::Set(
            children
                .iter()
                .map(|&name| HgPathBuf::from_bytes(name))
                .collect(),
        )
    }
    // Single-pattern `IncludeMatcher`; the pattern's source path is empty.
    let include = |syntax: PatternSyntax, pattern: &[u8]| {
        let patterns =
            vec![IgnorePattern::new(syntax, pattern, Path::new(""))];
        IncludeMatcher::new(patterns).unwrap()
    };

    // VisitchildrensetPrefix
    let matcher = include(PatternSyntax::RelPath, b"dir/subdir");
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Recursive);
    // OPT: This should probably be 'all' if its parent is?
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);

    // VisitchildrensetRootfilesin
    let matcher = include(PatternSyntax::RootFilesIn, b"dir/subdir");
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);

    // VisitchildrensetGlob
    let matcher = include(PatternSyntax::Glob, b"dir/z*");
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir"), VisitChildrenSet::This);
    // OPT: these should probably be set().
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::This);

    // VisitchildrensetFilePath
    let matcher = include(PatternSyntax::FilePath, b"dir/z");
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"z"]));
    // Nothing below `dir` other than `z` can match, so these are `Empty`.
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::Empty);

    // Test multiple patterns
    let matcher = IncludeMatcher::new(vec![
        IgnorePattern::new(PatternSyntax::RelPath, b"foo", Path::new("")),
        IgnorePattern::new(PatternSyntax::Glob, b"g*", Path::new("")),
    ])
    .unwrap();
    assert_eq!(visit(&matcher, b""), VisitChildrenSet::This);

    // Test a single recursive (`**`) glob
    let matcher = include(PatternSyntax::Glob, b"**/*.exe");
    assert_eq!(visit(&matcher, b""), VisitChildrenSet::This);
}
Raphaël Gomès
rust: add UnionMatcher...
r50243
#[test]
fn test_unionmatcher() {
    /// Asks `m` which children of directory `dir` need to be visited.
    fn visit<M: Matcher>(m: &M, dir: &[u8]) -> VisitChildrenSet {
        m.visit_children_set(HgPath::new(dir))
    }
    /// Expected answer consisting of exactly the given child names.
    fn set_of(children: &[&[u8]]) -> VisitChildrenSet {
        VisitChildrenSet::Set(
            children
                .iter()
                .map(|&name| HgPathBuf::from_bytes(name))
                .collect(),
        )
    }
    // Single-pattern `IncludeMatcher`; the pattern's source path is empty.
    let include = |syntax: PatternSyntax, pattern: &[u8]| {
        let patterns =
            vec![IgnorePattern::new(syntax, pattern, Path::new(""))];
        IncludeMatcher::new(patterns).unwrap()
    };

    // Path + Rootfiles
    let m1 = include(PatternSyntax::RelPath, b"dir/subdir");
    let m2 = include(PatternSyntax::RootFilesIn, b"dir");
    let matcher = UnionMatcher::new(vec![Box::new(m1), Box::new(m2)]);
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Recursive);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    // This assertion used to be written twice in a row; once is enough.
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    // OPT: These next two could be 'all' instead of 'this'.
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::This);

    // Path + unrelated Path
    let m1 = include(PatternSyntax::RelPath, b"dir/subdir");
    let m2 = include(PatternSyntax::RelPath, b"folder");
    let matcher = UnionMatcher::new(vec![Box::new(m1), Box::new(m2)]);
    assert_eq!(visit(&matcher, b""), set_of(&[b"folder", b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Recursive);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Recursive);
    // OPT: These next two could be 'all' instead of 'this'.
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::This);

    // Path + subpath
    let m1 = include(PatternSyntax::RelPath, b"dir/subdir/x");
    let m2 = include(PatternSyntax::RelPath, b"dir/subdir");
    let matcher = UnionMatcher::new(vec![Box::new(m1), Box::new(m2)]);
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Recursive);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(
        visit(&matcher, b"dir/subdir/x"),
        VisitChildrenSet::Recursive
    );
    // OPT: this should probably be 'all' not 'this'.
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::This);
}
Raphaël Gomès
rust: add IntersectionMatcher...
r50245
#[test]
fn test_intersectionmatcher() {
    /// Asks `m` which children of directory `dir` need to be visited.
    fn visit<M: Matcher>(m: &M, dir: &[u8]) -> VisitChildrenSet {
        m.visit_children_set(HgPath::new(dir))
    }
    /// Expected answer consisting of exactly the given child names.
    fn set_of(children: &[&[u8]]) -> VisitChildrenSet {
        VisitChildrenSet::Set(
            children
                .iter()
                .map(|&name| HgPathBuf::from_bytes(name))
                .collect(),
        )
    }
    // Single-pattern `IncludeMatcher`; the pattern's source path is empty.
    let include = |syntax: PatternSyntax, pattern: &[u8]| {
        let patterns =
            vec![IgnorePattern::new(syntax, pattern, Path::new(""))];
        IncludeMatcher::new(patterns).unwrap()
    };

    // Include path + Include rootfiles
    let matcher = IntersectionMatcher::new(
        Box::new(include(PatternSyntax::RelPath, b"dir/subdir")),
        Box::new(include(PatternSyntax::RootFilesIn, b"dir")),
    );
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::Empty);

    // Non intersecting paths
    let matcher = IntersectionMatcher::new(
        Box::new(include(PatternSyntax::RelPath, b"dir/subdir")),
        Box::new(include(PatternSyntax::RelPath, b"folder")),
    );
    assert_eq!(visit(&matcher, b""), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::Empty);

    // Nested paths
    let matcher = IntersectionMatcher::new(
        Box::new(include(PatternSyntax::RelPath, b"dir/subdir/x")),
        Box::new(include(PatternSyntax::RelPath, b"dir/subdir")),
    );
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), set_of(&[b"x"]));
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::Empty);
    // OPT: this should probably be 'all' not 'this'.
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::This);

    // Diverging paths
    let matcher = IntersectionMatcher::new(
        Box::new(include(PatternSyntax::RelPath, b"dir/subdir/x")),
        Box::new(include(PatternSyntax::RelPath, b"dir/subdir/z")),
    );
    // OPT: these next two could probably be Empty as well.
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::Empty);
}
Raphaël Gomès
rust-matchers: implement DifferenceMatcher...
r50373
#[test]
fn test_differencematcher() {
    /// Asks `m` which children of directory `dir` need to be visited.
    fn visit<M: Matcher>(m: &M, dir: &[u8]) -> VisitChildrenSet {
        m.visit_children_set(HgPath::new(dir))
    }
    /// Expected answer consisting of exactly the given child names.
    fn set_of(children: &[&[u8]]) -> VisitChildrenSet {
        VisitChildrenSet::Set(
            children
                .iter()
                .map(|&name| HgPathBuf::from_bytes(name))
                .collect(),
        )
    }
    // Directories probed by the two always/never scenarios below.
    let probed_dirs: [&[u8]; 7] = [
        b"",
        b"dir",
        b"dir/subdir",
        b"dir/subdir/z",
        b"dir/foo",
        b"dir/subdir/x",
        b"folder",
    ];

    // Two alwaysmatchers should function like a nevermatcher
    let matcher = DifferenceMatcher::new(
        Box::new(AlwaysMatcher),
        Box::new(AlwaysMatcher),
    );
    for &dir in &probed_dirs {
        assert_eq!(visit(&matcher, dir), VisitChildrenSet::Empty);
    }

    // One always and one never should behave the same as an always
    let matcher = DifferenceMatcher::new(
        Box::new(AlwaysMatcher),
        Box::new(NeverMatcher),
    );
    for &dir in &probed_dirs {
        assert_eq!(visit(&matcher, dir), VisitChildrenSet::Recursive);
    }

    // Two include matchers
    let included = IncludeMatcher::new(vec![IgnorePattern::new(
        PatternSyntax::RelPath,
        b"dir/subdir",
        Path::new("/repo"),
    )])
    .unwrap();
    let excluded = IncludeMatcher::new(vec![IgnorePattern::new(
        PatternSyntax::RootFilesIn,
        b"dir",
        Path::new("/repo"),
    )])
    .unwrap();
    let matcher =
        DifferenceMatcher::new(Box::new(included), Box::new(excluded));
    assert_eq!(visit(&matcher, b""), set_of(&[b"dir"]));
    assert_eq!(visit(&matcher, b"dir"), set_of(&[b"subdir"]));
    assert_eq!(visit(&matcher, b"dir/subdir"), VisitChildrenSet::Recursive);
    assert_eq!(visit(&matcher, b"dir/foo"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"folder"), VisitChildrenSet::Empty);
    assert_eq!(visit(&matcher, b"dir/subdir/z"), VisitChildrenSet::This);
    assert_eq!(visit(&matcher, b"dir/subdir/x"), VisitChildrenSet::This);
}
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457
mod invariants {
pub mod visit_children_set {
use crate::{
matchers::{tests::Tree, Matcher, VisitChildrenSet},
utils::hg_path::HgPath,
};
#[allow(dead_code)]
#[derive(Debug)]
struct Error<'a, M> {
matcher: &'a M,
path: &'a HgPath,
matching: &'a Tree,
visit_children_set: &'a VisitChildrenSet,
}
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 fn holds(
matching: &Tree,
not_matching: &Tree,
vcs: &VisitChildrenSet,
) -> bool {
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 match vcs {
VisitChildrenSet::Empty => matching.is_empty(),
VisitChildrenSet::This => {
// `This` does not come with any obligations.
true
}
VisitChildrenSet::Recursive => {
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 // `Recursive` requires that *everything* in the
// subtree matches. This
// requirement is relied on for example in
// DifferenceMatcher implementation.
not_matching.is_empty()
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 }
VisitChildrenSet::Set(allowed_children) => {
// `allowed_children` does not distinguish between
// files and directories: if it's not included, it
// must not be matched.
for k in matching.dirs.keys() {
if !(allowed_children.contains(k)) {
return false;
}
}
for k in matching.files.iter() {
if !(allowed_children.contains(k)) {
return false;
}
}
true
}
}
}
pub fn check<M: Matcher + std::fmt::Debug>(
matcher: &M,
path: &HgPath,
matching: &Tree,
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 not_matching: &Tree,
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 visit_children_set: &VisitChildrenSet,
) {
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 if !holds(matching, not_matching, visit_children_set) {
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 panic!(
"{:#?}",
Error {
matcher,
path,
visit_children_set,
matching
}
)
}
}
}
}
/// In-memory directory tree used as a fixture by the matcher tests.
#[derive(Debug, Clone)]
pub struct Tree {
    /// Names of the files directly inside this directory (single path
    /// components, joined onto the directory's path when matching).
    files: BTreeSet<HgPathBuf>,
    /// Sub-directories of this directory, keyed by their name.
    dirs: BTreeMap<HgPathBuf, Tree>,
}
impl Tree {
fn len(&self) -> usize {
let mut n = 0;
n += self.files.len();
for d in self.dirs.values() {
n += d.len();
}
n
}
fn is_empty(&self) -> bool {
self.files.is_empty() && self.dirs.is_empty()
}
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 fn make(
files: BTreeSet<HgPathBuf>,
dirs: BTreeMap<HgPathBuf, Tree>,
) -> Self {
Self {
files,
dirs: dirs
.into_iter()
.filter(|(_k, v)| (!(v.is_empty())))
.collect(),
}
}
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 fn filter_and_check<M: Matcher + Debug>(
&self,
m: &M,
path: &HgPath,
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 ) -> (Self, Self) {
let (files1, files2): (BTreeSet<HgPathBuf>, BTreeSet<HgPathBuf>) =
self.files
.iter()
.map(|v| v.to_owned())
.partition(|v| m.matches(&path.join(v)));
let (dirs1, dirs2): (
BTreeMap<HgPathBuf, Tree>,
BTreeMap<HgPathBuf, Tree>,
) = self
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 .dirs
.iter()
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 .map(|(k, v)| {
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 let path = path.join(k);
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 let (t1, t2) = v.filter_and_check(m, &path);
((k.clone(), t1), (k.clone(), t2))
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 })
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 .unzip();
let matching = Self::make(files1, dirs1);
let not_matching = Self::make(files2, dirs2);
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 let vcs = m.visit_children_set(path);
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 invariants::visit_children_set::check(
m,
path,
&matching,
&not_matching,
&vcs,
);
(matching, not_matching)
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 }
fn check_matcher<M: Matcher + Debug>(
&self,
m: &M,
expect_count: usize,
) {
let res = self.filter_and_check(m, &HgPathBuf::new());
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 if expect_count != res.0.len() {
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 eprintln!(
"warning: expected {} matches, got {} for {:#?}",
expect_count,
Arseniy Alekseyev
match: strengthen visit_children_set invariant, Recursive means "all files"...
r52464 res.0.len(),
Arseniy Alekseyev
tests: add tests and document expectations from visit_children_set in rust...
r52457 m
);
}
}
}
/// Builds a directory holding a fixed set of eight files plus the given
/// `(name, subtree)` sub-directories; each subtree is cloned into the result.
fn mkdir(children: &[(&[u8], &Tree)]) -> Tree {
    // Every directory of the fixture gets the same file names.
    const FILE_NAMES: [&[u8]; 8] = [
        b"a",
        b"b.txt",
        b"file.txt",
        b"c.c",
        b"c.h",
        b"dir1",
        b"dir2",
        b"subdir",
    ];
    let files = FILE_NAMES
        .iter()
        .map(|&name| HgPathBuf::from_bytes(name))
        .collect();
    let mut dirs = BTreeMap::new();
    for &(name, subtree) in children {
        dirs.insert(HgPathBuf::from_bytes(name), subtree.clone());
    }
    Tree { files, dirs }
}
/// Builds the fixture tree shared by the invariant tests: a nested chain
/// `a/b/c/d`, plus `dir`, `dir1` and `dir2`, each of which contains the
/// sub-directories `subdir` and `subdir.c`.
fn make_example_tree() -> Tree {
    let files_only = mkdir(&[]);

    // The `a/b/c/d` chain, built from the innermost directory outwards.
    let a_b_c = mkdir(&[(b"d", &files_only)]);
    let a_b = mkdir(&[(b"c", &a_b_c)]);
    let a = mkdir(&[(b"b", &a_b)]);

    // Shape shared by `dir`, `dir1` and `dir2`.
    let two_subdirs =
        mkdir(&[(b"subdir", &files_only), (b"subdir.c", &files_only)]);

    mkdir(&[
        (b"dir", &two_subdirs),
        (b"dir1", &two_subdirs),
        (b"dir2", &two_subdirs),
        (b"a", &a),
    ])
}
#[test]
fn test_pattern_matcher_visit_children_set() {
    // Single-pattern matchers; the pattern's source path is always empty.
    let pattern = |syntax: PatternSyntax, bytes: &[u8]| {
        let patterns = vec![IgnorePattern::new(syntax, bytes, Path::new(""))];
        PatternMatcher::new(patterns).unwrap()
    };
    let include = |syntax: PatternSyntax, bytes: &[u8]| {
        let patterns = vec![IgnorePattern::new(syntax, bytes, Path::new(""))];
        IncludeMatcher::new(patterns).unwrap()
    };

    let tree = make_example_tree();

    // All matchers are built up front, before any check runs.
    let pattern_dir1_glob_c = pattern(PatternSyntax::Glob, b"dir1/*.c");
    // These two are needed several times (and get boxed), hence factories.
    let pattern_dir1 = || pattern(PatternSyntax::Path, b"dir1");
    let pattern_dir1_a = pattern(PatternSyntax::Glob, b"dir1/a");
    let pattern_relglob_c = || pattern(PatternSyntax::RelGlob, b"*.c");

    let file_dir_subdir_b =
        FileMatcher::new(vec![HgPathBuf::from_bytes(b"dir/subdir/b.txt")])
            .unwrap();
    let file_abcdfile = FileMatcher::new(vec![
        HgPathBuf::from_bytes(b"file.txt"),
        HgPathBuf::from_bytes(b"a/file.txt"),
        HgPathBuf::from_bytes(b"a/b/file.txt"),
        // No file in a/b/c
        HgPathBuf::from_bytes(b"a/b/c/d/file.txt"),
    ])
    .unwrap();

    let rootfilesin_dir = pattern(PatternSyntax::RootFilesIn, b"dir");
    let pattern_filepath_dir_subdir =
        pattern(PatternSyntax::FilePath, b"dir/subdir");

    let include_dir_subdir = include(PatternSyntax::RelPath, b"dir/subdir");
    let include_glob_dir_s = include(PatternSyntax::Glob, b"dir/s*");
    // Test multiple patterns
    let include_dir_or_glob_s = IncludeMatcher::new(vec![
        IgnorePattern::new(PatternSyntax::RelPath, b"dir", Path::new("")),
        IgnorePattern::new(PatternSyntax::Glob, b"s*", Path::new("")),
    ])
    .unwrap();
    // Test a single recursive (`**`) glob
    let include_any_c = include(PatternSyntax::Glob, b"**/*.c");

    // Second argument: number of files each matcher is expected to match.
    tree.check_matcher(&pattern_dir1(), 25);
    tree.check_matcher(&pattern_dir1_a, 1);
    tree.check_matcher(&pattern_dir1_glob_c, 2);
    tree.check_matcher(&pattern_relglob_c(), 14);
    tree.check_matcher(&AlwaysMatcher, 112);
    tree.check_matcher(&NeverMatcher, 0);

    let intersection = IntersectionMatcher::new(
        Box::new(pattern_relglob_c()),
        Box::new(pattern_dir1()),
    );
    tree.check_matcher(&intersection, 3);

    let union = UnionMatcher::new(vec![
        Box::new(pattern_relglob_c()),
        Box::new(pattern_dir1()),
    ]);
    tree.check_matcher(&union, 36);

    let difference = DifferenceMatcher::new(
        Box::new(pattern_relglob_c()),
        Box::new(pattern_dir1()),
    );
    tree.check_matcher(&difference, 11);

    tree.check_matcher(&file_dir_subdir_b, 1);
    tree.check_matcher(&file_abcdfile, 4);
    tree.check_matcher(&rootfilesin_dir, 8);
    tree.check_matcher(&pattern_filepath_dir_subdir, 1);
    tree.check_matcher(&include_dir_subdir, 9);
    tree.check_matcher(&include_glob_dir_s, 17);
    tree.check_matcher(&include_dir_or_glob_s, 25);
    tree.check_matcher(&include_any_c, 35);
}
Raphaël Gomès
rust-matchers: implement `visit_children_set` for `FileMatcher`...
r44828 }