upstream/mercurial-mirror Commit - r42978:0def0fcb

rust-docstrings: add missing module docstrings...

Raphaël Gomès -

r42978:0def0fcb default

parent child

rust/hg-core/src/filepatterns.rs

0 +9 0

+            // filepatterns.rs
+            //
+            // Copyright 2019 Raphaël Gomès <rgomes@octobus.net>
+            //
+            // This software may be used and distributed according to the terms of the
+            // GNU General Public License version 2 or any later version.
+            //! Handling of Mercurial-specific patterns.
             use crate::{
                 utils::{files::get_path_from_bytes, SliceExt},
                 LineNumber, PatternError, PatternFileError,
             };
             use lazy_static::lazy_static;
             use regex::bytes::{NoExpand, Regex};
             use std::collections::HashMap;
             use std::fs::File;
             use std::io::Read;
             use std::vec::Vec;
             lazy_static! {
                 static ref RE_ESCAPE: Vec<Vec<u8>> = {
                     let mut v: Vec<Vec<u8>> = (0..=255).map(|byte| vec![byte]).collect();
                     let to_escape = b"()[]{}?*+-|^$\\.&~# \t\n\r\x0b\x0c";
                     for byte in to_escape {
                         v[*byte as usize].insert(0, b'\\');
                     }
                     v
                 };
             }
             /// These are matched in order
             const GLOB_REPLACEMENTS: &[(&[u8], &[u8])] =
                 &[(b"*/", b"(?:.*/)?"), (b"*", b".*"), (b"", b"[^/]*")];
             #[derive(Debug, Copy, Clone, PartialEq, Eq)]
             pub enum PatternSyntax {
                 Regexp,
                 /// Glob that matches at the front of the path
                 RootGlob,
                 /// Glob that matches at any suffix of the path (still anchored at slashes)
                 Glob,
                 Path,
                 RelPath,
                 RelGlob,
                 RelRegexp,
                 RootFiles,
             }
             /// Transforms a glob pattern into a regex
             fn glob_to_re(pat: &[u8]) -> Vec<u8> {
                 let mut input = pat;
                 let mut res: Vec<u8> = vec![];
                 let mut group_depth = 0;
                 while let Some((c, rest)) = input.split_first() {
                     input = rest;
                     match c {
                         b'*' => {
                             for (source, repl) in GLOB_REPLACEMENTS {
                                 if input.starts_with(source) {
                                     input = &input[source.len()..];
                                     res.extend(*repl);
                                     break;
                                 }
                             }
                         }
                         b'?' => res.extend(b"."),
                         b'[' => {
                             match input.iter().skip(1).position(|b| *b == b']') {
                                 None => res.extend(b"\\["),
                                 Some(end) => {
                                     // Account for the one we skipped
                                     let end = end + 1;
                                     res.extend(b"[");
                                     for (i, b) in input[..end].iter().enumerate() {
                                         if *b == b'!' && i == 0 {
                                             res.extend(b"^")
                                         } else if *b == b'^' && i == 0 {
                                             res.extend(b"\\^")
                                         } else if *b == b'\\' {
                                             res.extend(b"\\\\")
                                         } else {
                                             res.push(*b)
                                         }
                                     }
                                     res.extend(b"]");
                                     input = &input[end + 1..];
                                 }
                             }
                         }
                         b'{' => {
                             group_depth += 1;
                             res.extend(b"(?:")
                         }
                         b'}' if group_depth > 0 => {
                             group_depth -= 1;
                             res.extend(b")");
                         }
                         b',' if group_depth > 0 => res.extend(b"|"),
                         b'\\' => {
                             let c = {
                                 if let Some((c, rest)) = input.split_first() {
                                     input = rest;
                                     c
                                 } else {
                                     c
                                 }
                             };
                             res.extend(&RE_ESCAPE[*c as usize])
                         }
                         _ => res.extend(&RE_ESCAPE[*c as usize]),
                     }
                 }
                 res
             }
             fn escape_pattern(pattern: &[u8]) -> Vec<u8> {
                 pattern
                     .iter()
                     .flat_map(|c| RE_ESCAPE[*c as usize].clone())
                     .collect()
             }
             fn parse_pattern_syntax(kind: &[u8]) -> Result<PatternSyntax, PatternError> {
                 match kind {
                     b"re" => Ok(PatternSyntax::Regexp),
                     b"path" => Ok(PatternSyntax::Path),
                     b"relpath" => Ok(PatternSyntax::RelPath),
                     b"rootfilesin" => Ok(PatternSyntax::RootFiles),
                     b"relglob" => Ok(PatternSyntax::RelGlob),
                     b"relre" => Ok(PatternSyntax::RelRegexp),
                     b"glob" => Ok(PatternSyntax::Glob),
                     b"rootglob" => Ok(PatternSyntax::RootGlob),
                     _ => Err(PatternError::UnsupportedSyntax(
                         String::from_utf8_lossy(kind).to_string(),
                     )),
                 }
             }
             /// Builds the regex that corresponds to the given pattern.
             /// If within a `syntax: regexp` context, returns the pattern,
             /// otherwise, returns the corresponding regex.
             fn _build_single_regex(
                 syntax: PatternSyntax,
                 pattern: &[u8],
                 globsuffix: &[u8],
             ) -> Vec<u8> {
                 if pattern.is_empty() {
                     return vec![];
                 }
                 match syntax {
                     PatternSyntax::Regexp => pattern.to_owned(),
                     PatternSyntax::RelRegexp => {
                         if pattern[0] == b'^' {
                             return pattern.to_owned();
                         }
                         let mut res = b".*".to_vec();
                         res.extend(pattern);
                         res
                     }
                     PatternSyntax::Path | PatternSyntax::RelPath => {
                         if pattern == b"." {
                             return vec![];
                         }
                         let mut pattern = escape_pattern(pattern);
                         pattern.extend(b"(?:/|$)");
                         pattern
                     }
                     PatternSyntax::RootFiles => {
                         let mut res = if pattern == b"." {
                             vec![]
                         } else {
                             // Pattern is a directory name.
                             let mut as_vec: Vec<u8> = escape_pattern(pattern);
                             as_vec.push(b'/');
                             as_vec
                         };
                         // Anything after the pattern must be a non-directory.
                         res.extend(b"[^/]+$");
                         res
                     }
                     PatternSyntax::Glob
                     | PatternSyntax::RelGlob
                     | PatternSyntax::RootGlob => {
                         let mut res: Vec<u8> = vec![];
                         if syntax == PatternSyntax::RelGlob {
                             res.extend(b"(?:|.*/)");
                         }
                         res.extend(glob_to_re(pattern));
                         res.extend(globsuffix.iter());
                         res
                     }
                 }
             }
             const GLOB_SPECIAL_CHARACTERS: [u8; 7] =
                 [b'*', b'?', b'[', b']', b'{', b'}', b'\\'];
             /// Wrapper function to `_build_single_regex` that short-circuits 'exact' globs
             /// that don't need to be transformed into a regex.
             pub fn build_single_regex(
                 kind: &[u8],
                 pat: &[u8],
                 globsuffix: &[u8],
             ) -> Result<Vec<u8>, PatternError> {
                 let enum_kind = parse_pattern_syntax(kind)?;
                 if enum_kind == PatternSyntax::RootGlob
                     && !pat.iter().any(|b| GLOB_SPECIAL_CHARACTERS.contains(b))
                 {
                     let mut escaped = escape_pattern(pat);
                     escaped.extend(b"(?:/|$)");
                     Ok(escaped)
                 } else {
                     Ok(_build_single_regex(enum_kind, pat, globsuffix))
                 }
             }
             lazy_static! {
                 static ref SYNTAXES: HashMap<&'static [u8], &'static [u8]> = {
                     let mut m = HashMap::new();
                     m.insert(b"re".as_ref(), b"relre:".as_ref());
                     m.insert(b"regexp".as_ref(), b"relre:".as_ref());
                     m.insert(b"glob".as_ref(), b"relglob:".as_ref());
                     m.insert(b"rootglob".as_ref(), b"rootglob:".as_ref());
                     m.insert(b"include".as_ref(), b"include".as_ref());
                     m.insert(b"subinclude".as_ref(), b"subinclude".as_ref());
                     m
                 };
             }
             pub type PatternTuple = (Vec<u8>, LineNumber, Vec<u8>);
             type WarningTuple = (Vec<u8>, Vec<u8>);
             pub fn parse_pattern_file_contents(
                 lines: &[u8],
                 file_path: &[u8],
                 warn: bool,
             ) -> (Vec<PatternTuple>, Vec<WarningTuple>) {
                 let comment_regex = Regex::new(r"((?:^|[^\\])(?:\\\\)*)#.*").unwrap();
                 let comment_escape_regex = Regex::new(r"\\#").unwrap();
                 let mut inputs: Vec<PatternTuple> = vec![];
                 let mut warnings: Vec<WarningTuple> = vec![];
                 let mut current_syntax = b"relre:".as_ref();
                 for (line_number, mut line) in lines.split(|c| *c == b'\n').enumerate() {
                     let line_number = line_number + 1;
                     let line_buf;
                     if line.contains(&b'#') {
                         if let Some(cap) = comment_regex.captures(line) {
                             line = &line[..cap.get(1).unwrap().end()]
                         }
                         line_buf = comment_escape_regex.replace_all(line, NoExpand(b"#"));
                         line = &line_buf;
                     }
                     let mut line = line.trim_end();
                     if line.is_empty() {
                         continue;
                     }
                     if line.starts_with(b"syntax:") {
                         let syntax = line[b"syntax:".len()..].trim();
                         if let Some(rel_syntax) = SYNTAXES.get(syntax) {
                             current_syntax = rel_syntax;
                         } else if warn {
                             warnings.push((file_path.to_owned(), syntax.to_owned()));
                         }
                         continue;
                     }
                     let mut line_syntax: &[u8] = &current_syntax;
                     for (s, rels) in SYNTAXES.iter() {
                         if line.starts_with(rels) {
                             line_syntax = rels;
                             line = &line[rels.len()..];
                             break;
                         } else if line.starts_with(&[s, b":".as_ref()].concat()) {
                             line_syntax = rels;
                             line = &line[s.len() + 1..];
                             break;
                         }
                     }
                     inputs.push((
                         [line_syntax, line].concat(),
                         line_number,
                         line.to_owned(),
                     ));
                 }
                 (inputs, warnings)
             }
             pub fn read_pattern_file(
                 file_path: &[u8],
                 warn: bool,
             ) -> Result<(Vec<PatternTuple>, Vec<WarningTuple>), PatternFileError> {
                 let mut f = File::open(get_path_from_bytes(file_path))?;
                 let mut contents = Vec::new();
                 f.read_to_end(&mut contents)?;
                 Ok(parse_pattern_file_contents(&contents, file_path, warn))
             }
             #[cfg(test)]
             mod tests {
                 use super::*;
                 #[test]
                 fn escape_pattern_test() {
                     let untouched = br#"!"%',/0123456789:;<=>@ABCDEFGHIJKLMNOPQRSTUVWXYZ_`abcdefghijklmnopqrstuvwxyz"#;
                     assert_eq!(escape_pattern(untouched), untouched.to_vec());
                     // All escape codes
                     assert_eq!(
                         escape_pattern(br#"()[]{}?*+-|^$\\.&~# \t\n\r\v\f"#),
                         br#"\(\)\[\]\{\}\?\*\+\-\|\^\$\\\\\.\&\~\#\ \\t\\n\\r\\v\\f"#
                             .to_vec()
                     );
                 }
                 #[test]
                 fn glob_test() {
                     assert_eq!(glob_to_re(br#"?"#), br#"."#);
                     assert_eq!(glob_to_re(br#"*"#), br#"[^/]*"#);
                     assert_eq!(glob_to_re(br#"**"#), br#".*"#);
                     assert_eq!(glob_to_re(br#"**/a"#), br#"(?:.*/)?a"#);
                     assert_eq!(glob_to_re(br#"a/**/b"#), br#"a/(?:.*/)?b"#);
                     assert_eq!(glob_to_re(br#"[a*?!^][^b][!c]"#), br#"[a*?!^][\^b][^c]"#);
                     assert_eq!(glob_to_re(br#"{a,b}"#), br#"(?:a|b)"#);
                     assert_eq!(glob_to_re(br#".\*\?"#), br#"\.\*\?"#);
                 }
                 #[test]
                 fn test_parse_pattern_file_contents() {
                     let lines = b"syntax: glob\n*.elc";
                     assert_eq!(
                         vec![(b"relglob:*.elc".to_vec(), 2, b"*.elc".to_vec())],
                         parse_pattern_file_contents(lines, b"file_path", false).0,
                     );
                     let lines = b"syntax: include\nsyntax: glob";
                     assert_eq!(
                         parse_pattern_file_contents(lines, b"file_path", false).0,
                         vec![]
                     );
                     let lines = b"glob:**.o";
                     assert_eq!(
                         parse_pattern_file_contents(lines, b"file_path", false).0,
                         vec![(b"relglob:**.o".to_vec(), 1, b"**.o".to_vec())]
                     );
                 }
                 #[test]
                 fn test_build_single_regex_shortcut() {
                     assert_eq!(
                         br"(?:/|$)".to_vec(),
                         build_single_regex(b"rootglob", b"", b"").unwrap()
                     );
                     assert_eq!(
                         br"whatever(?:/|$)".to_vec(),
                         build_single_regex(b"rootglob", b"whatever", b"").unwrap()
                     );
                     assert_eq!(
                         br"[^/]*\.o".to_vec(),
                         build_single_regex(b"rootglob", b"*.o", b"").unwrap()
                     );
                 }
             }

rust/hg-core/src/utils.rs

0 +9 0

+            // utils module
+            //
+            // Copyright 2019 Raphaël Gomès <rgomes@octobus.net>
+            //
+            // This software may be used and distributed according to the terms of the
+            // GNU General Public License version 2 or any later version.
+            //! Contains useful functions, traits, structs, etc. for use in core.
             pub mod files;
             use std::convert::AsMut;
             /// Takes a slice and copies it into an array.
             ///
             /// # Panics
             ///
             /// Will panic if the slice and target array don't have the same length.
             pub fn copy_into_array<A, T>(slice: &[T]) -> A
             where
                 A: Sized + Default + AsMut<[T]>,
                 T: Copy,
             {
                 let mut a = Default::default();
                 <A as AsMut<[T]>>::as_mut(&mut a).copy_from_slice(slice);
                 a
             }
             /// Replaces the `from` slice with the `to` slice inside the `buf` slice.
             ///
             /// # Examples
             ///
             /// ```
             /// use crate::hg::utils::replace_slice;
             /// let mut line = b"I hate writing tests!".to_vec();
             /// replace_slice(&mut line, b"hate", b"love");
             /// assert_eq!(
             ///     line,
             ///     b"I love writing tests!".to_vec()
             ///);
             ///
             /// ```
             pub fn replace_slice<T>(buf: &mut [T], from: &[T], to: &[T])
             where
                 T: Clone + PartialEq,
             {
                 if buf.len() < from.len() || from.len() != to.len() {
                     return;
                 }
                 for i in 0..=buf.len() - from.len() {
                     if buf[i..].starts_with(from) {
                         buf[i..(i + from.len())].clone_from_slice(to);
                     }
                 }
             }
             pub trait SliceExt {
                 fn trim_end(&self) -> &Self;
                 fn trim_start(&self) -> &Self;
                 fn trim(&self) -> &Self;
             }
             fn is_not_whitespace(c: &u8) -> bool {
                 !(*c as char).is_whitespace()
             }
             impl SliceExt for [u8] {
                 fn trim_end(&self) -> &[u8] {
                     if let Some(last) = self.iter().rposition(is_not_whitespace) {
                         &self[..last + 1]
                     } else {
                         &[]
                     }
                 }
                 fn trim_start(&self) -> &[u8] {
                     if let Some(first) = self.iter().position(is_not_whitespace) {
                         &self[first..]
                     } else {
                         &[]
                     }
                 }
                 /// ```
                 /// use hg::utils::SliceExt;
                 /// assert_eq!(
                 ///     b"  to trim  ".trim(),
                 ///     b"to trim"
                 /// );
                 /// assert_eq!(
                 ///     b"to trim  ".trim(),
                 ///     b"to trim"
                 /// );
                 /// assert_eq!(
                 ///     b"  to trim".trim(),
                 ///     b"to trim"
                 /// );
                 /// ```
                 fn trim(&self) -> &[u8] {
                     self.trim_start().trim_end()
                 }
             }

rust/hg-core/src/utils/files.rs

0 +11 0

+            // files.rs
+            //
+            // Copyright 2019
+            // Raphaël Gomès <rgomes@octobus.net>,
+            // Yuya Nishihara <yuya@tcha.org>
+            //
+            // This software may be used and distributed according to the terms of the
+            // GNU General Public License version 2 or any later version.
+            //! Functions for fiddling with files.
             use std::iter::FusedIterator;
             use std::path::Path;
             pub fn get_path_from_bytes(bytes: &[u8]) -> &Path {
                 let os_str;
                 #[cfg(unix)]
                 {
                     use std::os::unix::ffi::OsStrExt;
                     os_str = std::ffi::OsStr::from_bytes(bytes);
                 }
                 #[cfg(windows)]
                 {
                     // TODO: convert from Windows MBCS (ANSI encoding) to WTF8.
                     // Perhaps, the return type would have to be Result<PathBuf>.
                     use std::os::windows::ffi::OsStrExt;
                     os_str = std::ffi::OsString::from_wide(bytes);
                 }
                 Path::new(os_str)
             }
             /// An iterator over repository path yielding itself and its ancestors.
             #[derive(Copy, Clone, Debug)]
             pub struct Ancestors<'a> {
                 next: Option<&'a [u8]>,
             }
             impl<'a> Iterator for Ancestors<'a> {
                 // if we had an HgPath type, this would yield &'a HgPath
                 type Item = &'a [u8];
                 fn next(&mut self) -> Option<Self::Item> {
                     let next = self.next;
                     self.next = match self.next {
                         Some(s) if s.is_empty() => None,
                         Some(s) => {
                             let p = s.iter().rposition(|&c| c == b'/').unwrap_or(0);
                             Some(&s[..p])
                         }
                         None => None,
                     };
                     next
                 }
             }
             impl<'a> FusedIterator for Ancestors<'a> {}
             /// Returns an iterator yielding ancestor directories of the given repository
             /// path.
             ///
             /// The path is separated by '/', and must not start with '/'.
             ///
             /// The path itself isn't included unless it is b"" (meaning the root
             /// directory.)
             pub fn find_dirs<'a>(path: &'a [u8]) -> Ancestors<'a> {
                 let mut dirs = Ancestors { next: Some(path) };
                 if !path.is_empty() {
                     dirs.next(); // skip itself
                 }
                 dirs
             }
             #[cfg(test)]
             mod tests {
                 #[test]
                 fn find_dirs_some() {
                     let mut dirs = super::find_dirs(b"foo/bar/baz");
                     assert_eq!(dirs.next(), Some(b"foo/bar".as_ref()));
                     assert_eq!(dirs.next(), Some(b"foo".as_ref()));
                     assert_eq!(dirs.next(), Some(b"".as_ref()));
                     assert_eq!(dirs.next(), None);
                     assert_eq!(dirs.next(), None);
                 }
                 #[test]
                 fn find_dirs_empty() {
                     // looks weird, but mercurial.util.finddirs(b"") yields b""
                     let mut dirs = super::find_dirs(b"");
                     assert_eq!(dirs.next(), Some(b"".as_ref()));
                     assert_eq!(dirs.next(), None);
                     assert_eq!(dirs.next(), None);
                 }
             }

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages