upstream/mercurial-mirror Commit - r49051:027ebad9

rhg: internally, return a structured representation from hg cat...

Arseniy Alekseyev -

r49051:027ebad9 default

parent child

rust/hg-core/src/operations/cat.rs

0 +26 -26

             // cat.rs
             //
             // Copyright 2020 Antoine Cezar <antoine.cezar@octobus.net>
             //
             // This software may be used and distributed according to the terms of the
             // GNU General Public License version 2 or any later version.
             use crate::repo::Repo;
             use crate::revlog::revlog::RevlogError;
             use crate::revlog::Node;
             use crate::utils::hg_path::HgPath;
-            use crate::utils::hg_path::HgPathBuf;
             use itertools::put_back;
             use itertools::PutBack;
             use std::cmp::Ordering;
-            pub struct CatOutput {
+            pub struct CatOutput<'a> {
                 // With the `'a` parameter, `results` and `missing` borrow the paths
                 // that were passed to `cat` instead of holding owned copies.
                 /// Whether any file in the manifest matched the paths given as CLI
                 /// arguments
                 pub found_any: bool,
                 /// The contents of matching files, in manifest order
                 ///
                 /// In the structured form, each entry pairs a requested path with the
                 /// contents of that file.
-                pub concatenated: Vec<u8>,
+                pub results: Vec<(&'a HgPath, Vec<u8>)>,
                 /// Which of the CLI arguments did not match any manifest file
-                pub missing: Vec<HgPathBuf>,
+                pub missing: Vec<&'a HgPath>,
                 /// The node ID that the given revset was resolved to
                 pub node: Node,
             }
             // Find an item in an iterator over a sorted collection.
             //
             // Entries whose path compares (byte-wise) less than `needle` are consumed
             // and skipped. On an exact match the entry's data is returned. If an
             // entry greater than `needle` is reached first, it is put back into the
             // iterator so that a later search can still see it, and `None` is
             // returned. `None` is also returned when the iterator is exhausted.
             fn find_item<'a, 'b, 'c, D, I: Iterator<Item = (&'a HgPath, D)>>(
                 i: &mut PutBack<I>,
                 needle: &'b HgPath,
-            ) -> Option<I::Item> {
+            ) -> Option<D> {
                 loop {
                     match i.next() {
                         None => return None,
                         Some(val) => match needle.as_bytes().cmp(val.0.as_bytes()) {
                             // `needle` sorts before this entry: it cannot appear
                             // later, so keep the entry for the next lookup.
                             Ordering::Less => {
                                 i.put_back(val);
                                 return None;
                             }
                             // `needle` sorts after this entry: drop it and go on.
                             Ordering::Greater => continue,
-                            Ordering::Equal => return Some(val),
+                            Ordering::Equal => return Some(val.1),
                         },
                     }
                 }
             }
             // Look up every queried path in the manifest iterator.
             //
             // Returns two vectors: the matches (in the structured form, each is the
             // queried path paired with the data the manifest holds for it) and the
             // queried paths for which `find_item` found nothing.
             //
             // The manifest iterator is only ever advanced, never rewound, so this
             // assumes both inputs yield paths in ascending byte order. The caller
             // sorts the query; the manifest's ordering is assumed (TODO confirm).
             fn find_files_in_manifest<
-                'a,
+                'manifest,
-                'b,
+                'query,
-                D,
+                Data,
-                I: Iterator<Item = (&'a HgPath, D)>,
+                Manifest: Iterator<Item = (&'manifest HgPath, Data)>,
-                J: Iterator<Item = &'b HgPath>,
+                Query: Iterator<Item = &'query HgPath>,
             >(
-                manifest: I,
+                manifest: Manifest,
-                files: J,
+                query: Query,
-            ) -> (Vec<(&'a HgPath, D)>, Vec<&'b HgPath>) {
+            ) -> (Vec<(&'query HgPath, Data)>, Vec<&'query HgPath>) {
                 // `put_back` lets `find_item` return an entry it read one step too far.
                 let mut manifest = put_back(manifest);
                 let mut res = vec![];
                 let mut missing = vec![];
-                for file in files {
+                for file in query {
                     match find_item(&mut manifest, file) {
                         None => missing.push(file),
-                        Some(item) => res.push(item),
+                        Some(item) => res.push((file, item)),
                     }
                 }
                 return (res, missing);
             }
             /// Output the given revision of files
             ///
             /// * `repo`: The repository to read from.
             /// * `revset`: Revset that is resolved to the single revision to cat the
             ///   files from.
             /// * `files`: The files to output.
             ///
             /// Returns a `CatOutput` holding the resolved node, the files that were
             /// found, and the requested paths that matched nothing in the manifest.
             ///
             /// # Errors
             ///
             /// Failures while resolving the revset, reading the manifest or
             /// changelog, opening a filelog, parsing a file node or reading file data
             /// are propagated with `?`.
             ///
             /// # Panics
             ///
             /// Panics if the changelog has no node for the resolved revision; the
             /// `expect` message states this should not happen once the manifest was
             /// read successfully.
             pub fn cat<'a>(
                 repo: &Repo,
                 revset: &str,
-                mut files: Vec<HgPathBuf>,
+                mut files: Vec<&'a HgPath>,
-            ) -> Result<CatOutput, RevlogError> {
+            ) -> Result<CatOutput<'a>, RevlogError> {
                 let rev = crate::revset::resolve_single(revset, repo)?;
                 let manifest = repo.manifest_for_rev(rev)?;
                 let node = *repo
                     .changelog()?
                     .node_from_rev(rev)
                     .expect("should succeed when repo.manifest did");
-                let mut bytes: Vec<u8> = vec![];
+                let mut results: Vec<(&'a HgPath, Vec<u8>)> = vec![];
                 let mut found_any = false;
                 // Sort the requested paths so that they can be matched against the
                 // manifest in one forward pass (see `find_files_in_manifest`).
                 files.sort_unstable();
                 let (found, missing) = find_files_in_manifest(
                     manifest.files_with_nodes(),
-                    files.iter().map(|f| f.as_ref()),
+                    files.into_iter().map(|f| f.as_ref()),
                 );
                 // For every match, open the file's filelog and read the contents
                 // stored under the node recorded in the manifest.
-                for (manifest_file, node_bytes) in found {
+                for (file_path, node_bytes) in found {
                     found_any = true;
-                    let file_log = repo.filelog(manifest_file)?;
+                    let file_log = repo.filelog(file_path)?;
                     let file_node = Node::from_hex_for_repo(node_bytes)?;
-                    bytes.extend(file_log.data_for_node(file_node)?.data()?);
+                    results.push((
+                        file_path,
+                        file_log.data_for_node(file_node)?.into_data()?,
+                    ));
                 }
-                let missing: Vec<HgPathBuf> =
-                    missing.iter().map(|file| (*file).to_owned()).collect();
                 Ok(CatOutput {
                     found_any,
-                    concatenated: bytes,
+                    results,
                     missing,
                     node,
                 })
             }

rust/hg-core/src/revlog/filelog.rs

0 +25 -6

             use crate::errors::HgError;
             use crate::repo::Repo;
             use crate::revlog::path_encode::path_encode;
             use crate::revlog::revlog::{Revlog, RevlogError};
             use crate::revlog::NodePrefix;
             use crate::revlog::Revision;
             use crate::utils::files::get_path_from_bytes;
             use crate::utils::hg_path::HgPath;
             use crate::utils::SliceExt;
-            use std::borrow::Cow;
             use std::path::PathBuf;
             /// A specialized `Revlog` to work with file data logs.
             pub struct Filelog {
                 /// The generic `revlog` format.
                 revlog: Revlog,
             }
             impl Filelog {
                 /// Opens the filelog of `file_path` in `repo`.
                 ///
                 /// The index and data file locations are derived from `file_path`
                 /// with `store_path`, using the `.i` and `.d` suffixes respectively.
                 pub fn open(repo: &Repo, file_path: &HgPath) -> Result<Self, HgError> {
                     let index_path = store_path(file_path, b".i");
                     let data_path = store_path(file_path, b".d");
                     let revlog = Revlog::open(repo, index_path, Some(&data_path))?;
                     Ok(Self { revlog })
                 }
                 /// The given node ID is that of the file as found in a manifest, not of a
                 /// changeset.
                 ///
                 /// Resolves the node (or node prefix) to a revision of this filelog
                 /// and delegates to `data_for_rev`.
                 pub fn data_for_node(
                     &self,
                     file_node: impl Into<NodePrefix>,
                 ) -> Result<FilelogEntry, RevlogError> {
                     let file_rev = self.revlog.rev_from_node(file_node.into())?;
                     self.data_for_rev(file_rev)
                 }
                 /// The given revision is that of the file as found in a manifest, not of a
                 /// changeset.
                 ///
                 /// Reads the revision's data from the underlying revlog and wraps it,
                 /// unparsed, in a `FilelogEntry`.
                 pub fn data_for_rev(
                     &self,
                     file_rev: Revision,
                 ) -> Result<FilelogEntry, RevlogError> {
-                    let data = self.revlog.get_rev_data(file_rev)?;
+                    let data: Vec<u8> = self.revlog.get_rev_data(file_rev)?;
                     Ok(FilelogEntry(data.into()))
                 }
             }
             /// Builds the on-disk path for a tracked file's revlog component.
             ///
             /// The bytes `data/`, the path bytes and `suffix` are joined in that
             /// order, passed through `path_encode`, and converted to a `PathBuf`.
             fn store_path(hg_path: &HgPath, suffix: &[u8]) -> PathBuf {
                 let mut raw_name: Vec<u8> = b"data/".to_vec();
                 raw_name.extend_from_slice(hg_path.as_bytes());
                 raw_name.extend_from_slice(suffix);
                 let encoded_name = path_encode(&raw_name);
                 get_path_from_bytes(&encoded_name).into()
             }
-            pub struct FilelogEntry<'filelog>(Cow<'filelog, [u8]>);
+            pub struct FilelogEntry(Vec<u8>);
-            impl<'filelog> FilelogEntry<'filelog> {
+            impl FilelogEntry {
                 // Layout handled below: an entry that begins with the two bytes
                 // `\x01\n` carries a metadata section that must be closed by a second
                 // `\x01\n`; whatever follows is the file data. An entry without that
                 // leading marker is treated as data only.
                 /// Split into metadata and data
-                pub fn split(&self) -> Result<(Option<&[u8]>, &[u8]), HgError> {
+                /// Returns None if there is no metadata, so the entire entry is data.
+                fn split_metadata(&self) -> Result<Option<(&[u8], &[u8])>, HgError> {
                     const DELIMITER: &[u8; 2] = &[b'\x01', b'\n'];
                     if let Some(rest) = self.0.drop_prefix(DELIMITER) {
                         if let Some((metadata, data)) = rest.split_2_by_slice(DELIMITER) {
-                            Ok((Some(metadata), data))
+                            Ok(Some((metadata, data)))
                         } else {
                             // Opening marker present but never closed.
                             Err(HgError::corrupted(
                                 "Missing metadata end delimiter in filelog entry",
                             ))
                         }
                     } else {
+                        Ok(None)
+                    }
+                }
+                /// Split into metadata and data
+                pub fn split(&self) -> Result<(Option<&[u8]>, &[u8]), HgError> {
+                    if let Some((metadata, data)) = self.split_metadata()? {
+                        Ok((Some(metadata), data))
+                    } else {
                         Ok((None, &self.0))
                     }
                 }
                 /// Returns the file contents at this revision, stripped of any metadata
                 pub fn data(&self) -> Result<&[u8], HgError> {
                     let (_metadata, data) = self.split()?;
                     Ok(data)
                 }
+                /// Consume the entry, and convert it into data, discarding any metadata,
+                /// if present.
                 // When metadata is present the data part is a sub-slice of the
                 // buffer and is copied out; otherwise the buffer itself is returned
                 // without copying.
+                pub fn into_data(self) -> Result<Vec<u8>, HgError> {
+                    if let Some((_metadata, data)) = self.split_metadata()? {
+                        Ok(data.to_owned())
+                    } else {
+                        Ok(self.0)
+                    }
+                }
             }

rust/rhg/src/commands/cat.rs

0 +4 -1

             use crate::error::CommandError;
             use clap::Arg;
             use format_bytes::format_bytes;
             use hg::operations::cat;
             use hg::utils::hg_path::HgPathBuf;
             use micro_timer::timed;
             use std::convert::TryFrom;
             /// Description of the `cat` subcommand; `args()` passes it to `.about(...)`.
             pub const HELP_TEXT: &str = "
             Output the current or given revision of files
             ";
             /// Builds the clap definition of the `cat` subcommand.
             ///
             /// It declares a `rev` option that takes a value named `REV`, and a
             /// required `files` argument that accepts one or more non-empty `FILE`
             /// values. `HELP_TEXT` is used as the subcommand description.
             pub fn args() -> clap::App<'static, 'static> {
                 let rev_option = Arg::with_name("rev")
                     .help("search the repository as it is in REV")
                     .short("-r")
                     .long("--rev")
                     .value_name("REV")
                     .takes_value(true);
                 let files_argument = Arg::with_name("files")
                     .required(true)
                     .multiple(true)
                     .empty_values(false)
                     .value_name("FILE")
                     .help("Files to output");
                 clap::SubCommand::with_name("cat")
                     .arg(rev_option)
                     .arg(files_argument)
                     .about(HELP_TEXT)
             }
             /// Entry point of the `cat` subcommand.
             ///
             /// Turns the `FILE` arguments into repository-relative paths, reads them
             /// at the requested revision (or, when no `rev` is given, at the first
             /// dirstate parent), writes the contents to stdout and reports every
             /// path that is not in that revision on stderr.
             ///
             /// Returns `Ok(())` when at least one file was found and
             /// `CommandError::Unsuccessful` otherwise. Filesets (`set:` prefix) and
             /// arguments that are `.` or contain a `..` segment are rejected as
             /// unsupported.
             #[timed]
             pub fn run(invocation: &crate::CliInvocation) -> Result<(), CommandError> {
                 let rev = invocation.subcommand_args.value_of("rev");
                 let file_args = match invocation.subcommand_args.values_of("files") {
                     Some(files) => files.collect(),
                     None => vec![],
                 };
                 let repo = invocation.repo?;
                 let cwd = hg::utils::current_dir()?;
                 let working_directory = repo.working_directory_path();
                 let working_directory = cwd.join(working_directory); // Make it absolute
                 let mut files = vec![];
                 for file in file_args.iter() {
                     if file.starts_with("set:") {
                         let message = "fileset";
                         return Err(CommandError::unsupported(message));
                     }
                     // Interpret the argument relative to the current directory.
                     let normalized = cwd.join(&file);
                     // TODO: actually normalize `..` path segments etc?
                     let dotted = normalized.components().any(|c| c.as_os_str() == "..");
                     if file == &"." || dotted {
                         let message = "`..` or `.` path segment";
                         return Err(CommandError::unsupported(message));
                     }
                     // Make the path relative to the working directory; a path that
                     // does not lie under it aborts (currently with an empty message).
                     let stripped = normalized
                         .strip_prefix(&working_directory)
                         // TODO: error message for path arguments outside of the repo
                         .map_err(|_| CommandError::abort(""))?;
                     let hg_file = HgPathBuf::try_from(stripped.to_path_buf())
                         .map_err(|e| CommandError::abort(e.to_string()))?;
                     files.push(hg_file);
                 }
                 // `cat` takes borrowed paths, so hand it references into the owned
                 // `HgPathBuf`s collected above.
+                let files = files.iter().map(|file| file.as_ref()).collect();
                 // TODO probably move this to a util function like `repo.default_rev` or
                 // something when it's used somewhere else
                 let rev = match rev {
                     Some(r) => r.to_string(),
                     None => format!("{:x}", repo.dirstate_parents()?.p1),
                 };
                 let output = cat(&repo, &rev, files).map_err(|e| (e, rev.as_str()))?;
-                invocation.ui.write_stdout(&output.concatenated)?;
+                for (_file, contents) in output.results {
+                    invocation.ui.write_stdout(&contents)?;
+                }
                 // Report each requested path that is absent from the revision,
                 // identified by the short form of the resolved node.
                 if !output.missing.is_empty() {
                     let short = format!("{:x}", output.node.short()).into_bytes();
                     for path in &output.missing {
                         invocation.ui.write_stderr(&format_bytes!(
                             b"{}: no such file in rev {}\n",
                             path.as_bytes(),
                             short
                         ))?;
                     }
                 }
                 if output.found_any {
                     Ok(())
                 } else {
                     Err(CommandError::Unsuccessful)
                 }
             }

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages