dirstate_map.rs
1314 lines
| 42.3 KiB
| application/rls-services+xml
|
RustLexer
Simon Sapin
|
r47872 | use bytes_cast::BytesCast; | ||
Simon Sapin
|
r47888 | use micro_timer::timed; | ||
Simon Sapin
|
r47895 | use std::borrow::Cow; | ||
Simon Sapin
|
r47889 | use std::convert::TryInto; | ||
Simon Sapin
|
r47865 | use std::path::PathBuf; | ||
Simon Sapin
|
r48058 | use super::on_disk; | ||
Simon Sapin
|
r48126 | use super::on_disk::DirstateV2ParseError; | ||
Simon Sapin
|
r47867 | use super::path_with_basename::WithBasename; | ||
Simon Sapin
|
r47872 | use crate::dirstate::parsers::pack_entry; | ||
use crate::dirstate::parsers::packed_entry_size; | ||||
Simon Sapin
|
r47868 | use crate::dirstate::parsers::parse_dirstate_entries; | ||
Simon Sapin
|
r47871 | use crate::dirstate::parsers::Timestamp; | ||
r48310 | use crate::dirstate::MTIME_UNSET; | |||
r48300 | use crate::dirstate::SIZE_FROM_OTHER_PARENT; | |||
use crate::dirstate::SIZE_NON_NORMAL; | ||||
r48310 | use crate::dirstate::V1_RANGEMASK; | |||
Simon Sapin
|
r47865 | use crate::matchers::Matcher; | ||
use crate::utils::hg_path::{HgPath, HgPathBuf}; | ||||
use crate::CopyMapIter; | ||||
use crate::DirstateEntry; | ||||
use crate::DirstateError; | ||||
use crate::DirstateParents; | ||||
use crate::DirstateStatus; | ||||
use crate::EntryState; | ||||
Simon Sapin
|
r47889 | use crate::FastHashMap; | ||
Simon Sapin
|
r47865 | use crate::PatternFileWarning; | ||
use crate::StateMapIter; | ||||
use crate::StatusError; | ||||
use crate::StatusOptions; | ||||
Simon Sapin
|
r48481 | /// Append to an existing data file if the amount of unreachable data (not used | ||
/// anymore) is less than this fraction of the total amount of existing data. | ||||
const ACCEPTABLE_UNREACHABLE_BYTES_RATIO: f32 = 0.5; | ||||
Simon Sapin
|
r47893 | pub struct DirstateMap<'on_disk> { | ||
/// Contents of the `.hg/dirstate` file | ||||
Simon Sapin
|
r48058 | pub(super) on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r47893 | |||
Simon Sapin
|
r47895 | pub(super) root: ChildNodes<'on_disk>, | ||
Simon Sapin
|
r47873 | |||
/// Number of nodes anywhere in the tree that have `.entry.is_some()`. | ||||
Simon Sapin
|
r48058 | pub(super) nodes_with_entry_count: u32, | ||
Simon Sapin
|
r47873 | |||
/// Number of nodes anywhere in the tree that have | ||||
/// `.copy_source.is_some()`. | ||||
Simon Sapin
|
r48058 | pub(super) nodes_with_copy_source_count: u32, | ||
Simon Sapin
|
r48202 | |||
/// See on_disk::Header | ||||
pub(super) ignore_patterns_hash: on_disk::IgnorePatternsHash, | ||||
Simon Sapin
|
r48481 | |||
/// How many bytes of `on_disk` are not used anymore | ||||
pub(super) unreachable_bytes: u32, | ||||
Simon Sapin
|
r47867 | } | ||
/// Using a plain `HgPathBuf` of the full path from the repository root as a | ||||
/// map key would also work: all paths in a given map have the same parent | ||||
/// path, so comparing full paths gives the same result as comparing base | ||||
Simon Sapin
|
r48057 | /// names. However `HashMap` would waste time always re-hashing the same | ||
Simon Sapin
|
r47867 | /// string prefix. | ||
Simon Sapin
|
r48057 | pub(super) type NodeKey<'on_disk> = WithBasename<Cow<'on_disk, HgPath>>; | ||
Simon Sapin
|
r48124 | |||
Simon Sapin
|
r48136 | /// Similar to `&'tree Cow<'on_disk, HgPath>`, but can also be returned | ||
/// for on-disk nodes that don’t actually have a `Cow` to borrow. | ||||
pub(super) enum BorrowedPath<'tree, 'on_disk> { | ||||
InMemory(&'tree HgPathBuf), | ||||
OnDisk(&'on_disk HgPath), | ||||
} | ||||
Simon Sapin
|
r48124 | pub(super) enum ChildNodes<'on_disk> { | ||
InMemory(FastHashMap<NodeKey<'on_disk>, Node<'on_disk>>), | ||||
Simon Sapin
|
r48128 | OnDisk(&'on_disk [on_disk::Node]), | ||
Simon Sapin
|
r48124 | } | ||
pub(super) enum ChildNodesRef<'tree, 'on_disk> { | ||||
InMemory(&'tree FastHashMap<NodeKey<'on_disk>, Node<'on_disk>>), | ||||
Simon Sapin
|
r48128 | OnDisk(&'on_disk [on_disk::Node]), | ||
Simon Sapin
|
r48124 | } | ||
pub(super) enum NodeRef<'tree, 'on_disk> { | ||||
InMemory(&'tree NodeKey<'on_disk>, &'tree Node<'on_disk>), | ||||
Simon Sapin
|
r48128 | OnDisk(&'on_disk on_disk::Node), | ||
Simon Sapin
|
r48124 | } | ||
Simon Sapin
|
r48136 | impl<'tree, 'on_disk> BorrowedPath<'tree, 'on_disk> { | ||
pub fn detach_from_tree(&self) -> Cow<'on_disk, HgPath> { | ||||
match *self { | ||||
BorrowedPath::InMemory(in_memory) => Cow::Owned(in_memory.clone()), | ||||
BorrowedPath::OnDisk(on_disk) => Cow::Borrowed(on_disk), | ||||
} | ||||
} | ||||
} | ||||
impl<'tree, 'on_disk> std::ops::Deref for BorrowedPath<'tree, 'on_disk> { | ||||
type Target = HgPath; | ||||
fn deref(&self) -> &HgPath { | ||||
match *self { | ||||
BorrowedPath::InMemory(in_memory) => in_memory, | ||||
BorrowedPath::OnDisk(on_disk) => on_disk, | ||||
} | ||||
} | ||||
} | ||||
Simon Sapin
|
r48124 | impl Default for ChildNodes<'_> { | ||
fn default() -> Self { | ||||
ChildNodes::InMemory(Default::default()) | ||||
} | ||||
} | ||||
impl<'on_disk> ChildNodes<'on_disk> { | ||||
pub(super) fn as_ref<'tree>( | ||||
&'tree self, | ||||
) -> ChildNodesRef<'tree, 'on_disk> { | ||||
match self { | ||||
ChildNodes::InMemory(nodes) => ChildNodesRef::InMemory(nodes), | ||||
Simon Sapin
|
r48128 | ChildNodes::OnDisk(nodes) => ChildNodesRef::OnDisk(nodes), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
pub(super) fn is_empty(&self) -> bool { | ||||
match self { | ||||
ChildNodes::InMemory(nodes) => nodes.is_empty(), | ||||
Simon Sapin
|
r48128 | ChildNodes::OnDisk(nodes) => nodes.is_empty(), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48481 | fn make_mut( | ||
Simon Sapin
|
r48124 | &mut self, | ||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48481 | unreachable_bytes: &mut u32, | ||
Simon Sapin
|
r48126 | ) -> Result< | ||
&mut FastHashMap<NodeKey<'on_disk>, Node<'on_disk>>, | ||||
DirstateV2ParseError, | ||||
> { | ||||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48126 | ChildNodes::InMemory(nodes) => Ok(nodes), | ||
Simon Sapin
|
r48128 | ChildNodes::OnDisk(nodes) => { | ||
Simon Sapin
|
r48481 | *unreachable_bytes += | ||
std::mem::size_of_val::<[on_disk::Node]>(nodes) as u32; | ||||
Simon Sapin
|
r48128 | let nodes = nodes | ||
.iter() | ||||
.map(|node| { | ||||
Ok(( | ||||
node.path(on_disk)?, | ||||
node.to_in_memory_node(on_disk)?, | ||||
)) | ||||
}) | ||||
.collect::<Result<_, _>>()?; | ||||
*self = ChildNodes::InMemory(nodes); | ||||
match self { | ||||
ChildNodes::InMemory(nodes) => Ok(nodes), | ||||
ChildNodes::OnDisk(_) => unreachable!(), | ||||
} | ||||
} | ||||
Simon Sapin
|
r48124 | } | ||
} | ||||
} | ||||
impl<'tree, 'on_disk> ChildNodesRef<'tree, 'on_disk> { | ||||
pub(super) fn get( | ||||
&self, | ||||
base_name: &HgPath, | ||||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48126 | ) -> Result<Option<NodeRef<'tree, 'on_disk>>, DirstateV2ParseError> { | ||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48126 | ChildNodesRef::InMemory(nodes) => Ok(nodes | ||
Simon Sapin
|
r48124 | .get_key_value(base_name) | ||
Simon Sapin
|
r48126 | .map(|(k, v)| NodeRef::InMemory(k, v))), | ||
Simon Sapin
|
r48128 | ChildNodesRef::OnDisk(nodes) => { | ||
let mut parse_result = Ok(()); | ||||
let search_result = nodes.binary_search_by(|node| { | ||||
match node.base_name(on_disk) { | ||||
Ok(node_base_name) => node_base_name.cmp(base_name), | ||||
Err(e) => { | ||||
parse_result = Err(e); | ||||
// Dummy comparison result, `search_result` won’t | ||||
// be used since `parse_result` is an error | ||||
std::cmp::Ordering::Equal | ||||
} | ||||
} | ||||
}); | ||||
parse_result.map(|()| { | ||||
search_result.ok().map(|i| NodeRef::OnDisk(&nodes[i])) | ||||
}) | ||||
} | ||||
Simon Sapin
|
r48124 | } | ||
} | ||||
/// Iterate in undefined order | ||||
pub(super) fn iter( | ||||
&self, | ||||
) -> impl Iterator<Item = NodeRef<'tree, 'on_disk>> { | ||||
match self { | ||||
Simon Sapin
|
r48128 | ChildNodesRef::InMemory(nodes) => itertools::Either::Left( | ||
nodes.iter().map(|(k, v)| NodeRef::InMemory(k, v)), | ||||
), | ||||
ChildNodesRef::OnDisk(nodes) => { | ||||
itertools::Either::Right(nodes.iter().map(NodeRef::OnDisk)) | ||||
Simon Sapin
|
r48124 | } | ||
} | ||||
} | ||||
/// Iterate in parallel in undefined order | ||||
pub(super) fn par_iter( | ||||
&self, | ||||
) -> impl rayon::iter::ParallelIterator<Item = NodeRef<'tree, 'on_disk>> | ||||
{ | ||||
use rayon::prelude::*; | ||||
match self { | ||||
Simon Sapin
|
r48128 | ChildNodesRef::InMemory(nodes) => rayon::iter::Either::Left( | ||
nodes.par_iter().map(|(k, v)| NodeRef::InMemory(k, v)), | ||||
), | ||||
ChildNodesRef::OnDisk(nodes) => rayon::iter::Either::Right( | ||||
nodes.par_iter().map(NodeRef::OnDisk), | ||||
), | ||||
Simon Sapin
|
r48124 | } | ||
} | ||||
pub(super) fn sorted(&self) -> Vec<NodeRef<'tree, 'on_disk>> { | ||||
match self { | ||||
ChildNodesRef::InMemory(nodes) => { | ||||
let mut vec: Vec<_> = nodes | ||||
.iter() | ||||
.map(|(k, v)| NodeRef::InMemory(k, v)) | ||||
.collect(); | ||||
Simon Sapin
|
r48126 | fn sort_key<'a>(node: &'a NodeRef) -> &'a HgPath { | ||
match node { | ||||
NodeRef::InMemory(path, _node) => path.base_name(), | ||||
Simon Sapin
|
r48128 | NodeRef::OnDisk(_) => unreachable!(), | ||
Simon Sapin
|
r48126 | } | ||
} | ||||
Simon Sapin
|
r48124 | // `sort_unstable_by_key` doesn’t allow keys borrowing from the | ||
// value: https://github.com/rust-lang/rust/issues/34162 | ||||
Simon Sapin
|
r48126 | vec.sort_unstable_by(|a, b| sort_key(a).cmp(sort_key(b))); | ||
Simon Sapin
|
r48124 | vec | ||
} | ||||
Simon Sapin
|
r48128 | ChildNodesRef::OnDisk(nodes) => { | ||
// Nodes on disk are already sorted | ||||
nodes.iter().map(NodeRef::OnDisk).collect() | ||||
} | ||||
Simon Sapin
|
r48124 | } | ||
} | ||||
} | ||||
impl<'tree, 'on_disk> NodeRef<'tree, 'on_disk> { | ||||
Simon Sapin
|
r48126 | pub(super) fn full_path( | ||
&self, | ||||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48126 | ) -> Result<&'tree HgPath, DirstateV2ParseError> { | ||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48126 | NodeRef::InMemory(path, _node) => Ok(path.full_path()), | ||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.full_path(on_disk), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48136 | /// Returns a `BorrowedPath`, which can be turned into a `Cow<'on_disk, | ||
/// HgPath>` detached from `'tree` | ||||
pub(super) fn full_path_borrowed( | ||||
Simon Sapin
|
r48126 | &self, | ||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48136 | ) -> Result<BorrowedPath<'tree, 'on_disk>, DirstateV2ParseError> { | ||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48136 | NodeRef::InMemory(path, _node) => match path.full_path() { | ||
Cow::Borrowed(on_disk) => Ok(BorrowedPath::OnDisk(on_disk)), | ||||
Cow::Owned(in_memory) => Ok(BorrowedPath::InMemory(in_memory)), | ||||
}, | ||||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => { | ||
Simon Sapin
|
r48136 | Ok(BorrowedPath::OnDisk(node.full_path(on_disk)?)) | ||
Simon Sapin
|
r48128 | } | ||
Simon Sapin
|
r48126 | } | ||
} | ||||
pub(super) fn base_name( | ||||
&self, | ||||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48126 | ) -> Result<&'tree HgPath, DirstateV2ParseError> { | ||
match self { | ||||
NodeRef::InMemory(path, _node) => Ok(path.base_name()), | ||||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.base_name(on_disk), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48126 | pub(super) fn children( | ||
&self, | ||||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48126 | ) -> Result<ChildNodesRef<'tree, 'on_disk>, DirstateV2ParseError> { | ||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48126 | NodeRef::InMemory(_path, node) => Ok(node.children.as_ref()), | ||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => { | ||
Ok(ChildNodesRef::OnDisk(node.children(on_disk)?)) | ||||
} | ||||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48126 | pub(super) fn has_copy_source(&self) -> bool { | ||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48126 | NodeRef::InMemory(_path, node) => node.copy_source.is_some(), | ||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.has_copy_source(), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48126 | pub(super) fn copy_source( | ||
&self, | ||||
Simon Sapin
|
r48128 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48126 | ) -> Result<Option<&'tree HgPath>, DirstateV2ParseError> { | ||
Simon Sapin
|
r48124 | match self { | ||
NodeRef::InMemory(_path, node) => { | ||||
Simon Sapin
|
r48126 | Ok(node.copy_source.as_ref().map(|s| &**s)) | ||
Simon Sapin
|
r48124 | } | ||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.copy_source(on_disk), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48126 | pub(super) fn entry( | ||
&self, | ||||
) -> Result<Option<DirstateEntry>, DirstateV2ParseError> { | ||||
Simon Sapin
|
r48124 | match self { | ||
Simon Sapin
|
r48137 | NodeRef::InMemory(_path, node) => { | ||
Ok(node.data.as_entry().copied()) | ||||
} | ||||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.entry(), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48126 | |||
pub(super) fn state( | ||||
&self, | ||||
) -> Result<Option<EntryState>, DirstateV2ParseError> { | ||||
Simon Sapin
|
r48124 | match self { | ||
NodeRef::InMemory(_path, node) => { | ||||
Simon Sapin
|
r48137 | Ok(node.data.as_entry().map(|entry| entry.state)) | ||
Simon Sapin
|
r48124 | } | ||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.state(), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
Simon Sapin
|
r48138 | pub(super) fn cached_directory_mtime( | ||
&self, | ||||
Simon Sapin
|
r48140 | ) -> Option<&'tree on_disk::Timestamp> { | ||
Simon Sapin
|
r48138 | match self { | ||
NodeRef::InMemory(_path, node) => match &node.data { | ||||
NodeData::CachedDirectory { mtime } => Some(mtime), | ||||
_ => None, | ||||
}, | ||||
NodeRef::OnDisk(node) => node.cached_directory_mtime(), | ||||
} | ||||
} | ||||
Simon Sapin
|
r48272 | pub(super) fn descendants_with_entry_count(&self) -> u32 { | ||
match self { | ||||
NodeRef::InMemory(_path, node) => { | ||||
node.descendants_with_entry_count | ||||
} | ||||
NodeRef::OnDisk(node) => node.descendants_with_entry_count.get(), | ||||
} | ||||
} | ||||
Simon Sapin
|
r48124 | pub(super) fn tracked_descendants_count(&self) -> u32 { | ||
match self { | ||||
NodeRef::InMemory(_path, node) => node.tracked_descendants_count, | ||||
Simon Sapin
|
r48128 | NodeRef::OnDisk(node) => node.tracked_descendants_count.get(), | ||
Simon Sapin
|
r48124 | } | ||
} | ||||
} | ||||
Simon Sapin
|
r47867 | |||
Simon Sapin
|
r47876 | /// Represents a file or a directory | ||
Simon Sapin
|
r47867 | #[derive(Default)] | ||
Simon Sapin
|
r47895 | pub(super) struct Node<'on_disk> { | ||
Simon Sapin
|
r48137 | pub(super) data: NodeData, | ||
Simon Sapin
|
r47876 | |||
Simon Sapin
|
r47895 | pub(super) copy_source: Option<Cow<'on_disk, HgPath>>, | ||
Simon Sapin
|
r47876 | |||
Simon Sapin
|
r47895 | pub(super) children: ChildNodes<'on_disk>, | ||
Simon Sapin
|
r47876 | |||
Simon Sapin
|
r48272 | /// How many (non-inclusive) descendants of this node have an entry. | ||
pub(super) descendants_with_entry_count: u32, | ||||
/// How many (non-inclusive) descendants of this node have an entry whose | ||||
/// state is "tracked". | ||||
Simon Sapin
|
r48058 | pub(super) tracked_descendants_count: u32, | ||
Simon Sapin
|
r47876 | } | ||
Simon Sapin
|
r48137 | pub(super) enum NodeData { | ||
Entry(DirstateEntry), | ||||
CachedDirectory { mtime: on_disk::Timestamp }, | ||||
None, | ||||
} | ||||
impl Default for NodeData { | ||||
fn default() -> Self { | ||||
NodeData::None | ||||
} | ||||
} | ||||
impl NodeData { | ||||
fn has_entry(&self) -> bool { | ||||
match self { | ||||
NodeData::Entry(_) => true, | ||||
_ => false, | ||||
} | ||||
} | ||||
fn as_entry(&self) -> Option<&DirstateEntry> { | ||||
match self { | ||||
NodeData::Entry(entry) => Some(entry), | ||||
_ => None, | ||||
} | ||||
} | ||||
} | ||||
Simon Sapin
|
r47893 | impl<'on_disk> DirstateMap<'on_disk> { | ||
Simon Sapin
|
r48058 | pub(super) fn empty(on_disk: &'on_disk [u8]) -> Self { | ||
Self { | ||||
on_disk, | ||||
root: ChildNodes::default(), | ||||
nodes_with_entry_count: 0, | ||||
nodes_with_copy_source_count: 0, | ||||
Simon Sapin
|
r48202 | ignore_patterns_hash: [0; on_disk::IGNORE_PATTERNS_HASH_LEN], | ||
Simon Sapin
|
r48481 | unreachable_bytes: 0, | ||
Simon Sapin
|
r48058 | } | ||
} | ||||
Simon Sapin
|
r48055 | #[timed] | ||
Simon Sapin
|
r48475 | pub fn new_v2( | ||
on_disk: &'on_disk [u8], | ||||
data_size: usize, | ||||
Simon Sapin
|
r48482 | metadata: &[u8], | ||
Simon Sapin
|
r48475 | ) -> Result<Self, DirstateError> { | ||
if let Some(data) = on_disk.get(..data_size) { | ||||
Simon Sapin
|
r48482 | Ok(on_disk::read(data, metadata)?) | ||
Simon Sapin
|
r48475 | } else { | ||
Err(DirstateV2ParseError.into()) | ||||
} | ||||
Simon Sapin
|
r48055 | } | ||
#[timed] | ||||
pub fn new_v1( | ||||
Simon Sapin
|
r47893 | on_disk: &'on_disk [u8], | ||
) -> Result<(Self, Option<DirstateParents>), DirstateError> { | ||||
Simon Sapin
|
r48058 | let mut map = Self::empty(on_disk); | ||
Simon Sapin
|
r48055 | if map.on_disk.is_empty() { | ||
return Ok((map, None)); | ||||
Simon Sapin
|
r47867 | } | ||
Simon Sapin
|
r47893 | |||
let parents = parse_dirstate_entries( | ||||
Simon Sapin
|
r48055 | map.on_disk, | ||
Simon Sapin
|
r47893 | |path, entry, copy_source| { | ||
let tracked = entry.state.is_tracked(); | ||||
Simon Sapin
|
r47896 | let node = Self::get_or_insert_node( | ||
Simon Sapin
|
r48127 | map.on_disk, | ||
Simon Sapin
|
r48481 | &mut map.unreachable_bytes, | ||
Simon Sapin
|
r48055 | &mut map.root, | ||
Simon Sapin
|
r47893 | path, | ||
Simon Sapin
|
r47896 | WithBasename::to_cow_borrowed, | ||
Simon Sapin
|
r47893 | |ancestor| { | ||
if tracked { | ||||
ancestor.tracked_descendants_count += 1 | ||||
} | ||||
Simon Sapin
|
r48272 | ancestor.descendants_with_entry_count += 1 | ||
Simon Sapin
|
r47893 | }, | ||
Simon Sapin
|
r48126 | )?; | ||
Simon Sapin
|
r47893 | assert!( | ||
Simon Sapin
|
r48137 | !node.data.has_entry(), | ||
Simon Sapin
|
r47893 | "duplicate dirstate entry in read" | ||
); | ||||
assert!( | ||||
node.copy_source.is_none(), | ||||
"duplicate dirstate entry in read" | ||||
); | ||||
Simon Sapin
|
r48137 | node.data = NodeData::Entry(*entry); | ||
Simon Sapin
|
r47895 | node.copy_source = copy_source.map(Cow::Borrowed); | ||
Simon Sapin
|
r48055 | map.nodes_with_entry_count += 1; | ||
Simon Sapin
|
r47893 | if copy_source.is_some() { | ||
Simon Sapin
|
r48055 | map.nodes_with_copy_source_count += 1 | ||
Simon Sapin
|
r47893 | } | ||
Simon Sapin
|
r48126 | Ok(()) | ||
Simon Sapin
|
r47893 | }, | ||
)?; | ||||
Simon Sapin
|
r48055 | let parents = Some(parents.clone()); | ||
Simon Sapin
|
r47893 | |||
Simon Sapin
|
r48055 | Ok((map, parents)) | ||
Simon Sapin
|
r47867 | } | ||
Simon Sapin
|
r48478 | /// Assuming dirstate-v2 format, returns whether the next write should | ||
/// append to the existing data file that contains `self.on_disk` (true), | ||||
/// or create a new data file from scratch (false). | ||||
pub(super) fn write_should_append(&self) -> bool { | ||||
Simon Sapin
|
r48481 | let ratio = self.unreachable_bytes as f32 / self.on_disk.len() as f32; | ||
ratio < ACCEPTABLE_UNREACHABLE_BYTES_RATIO | ||||
Simon Sapin
|
r48478 | } | ||
Simon Sapin
|
r48124 | fn get_node<'tree>( | ||
&'tree self, | ||||
path: &HgPath, | ||||
Simon Sapin
|
r48126 | ) -> Result<Option<NodeRef<'tree, 'on_disk>>, DirstateV2ParseError> { | ||
Simon Sapin
|
r48124 | let mut children = self.root.as_ref(); | ||
Simon Sapin
|
r47869 | let mut components = path.components(); | ||
let mut component = | ||||
components.next().expect("expected at least one components"); | ||||
loop { | ||||
Simon Sapin
|
r48127 | if let Some(child) = children.get(component, self.on_disk)? { | ||
Simon Sapin
|
r48126 | if let Some(next_component) = components.next() { | ||
component = next_component; | ||||
Simon Sapin
|
r48127 | children = child.children(self.on_disk)?; | ||
Simon Sapin
|
r48126 | } else { | ||
return Ok(Some(child)); | ||||
} | ||||
Simon Sapin
|
r47869 | } else { | ||
Simon Sapin
|
r48126 | return Ok(None); | ||
Simon Sapin
|
r47869 | } | ||
} | ||||
} | ||||
Simon Sapin
|
r47876 | /// Returns a mutable reference to the node at `path` if it exists | ||
/// | ||||
Simon Sapin
|
r47873 | /// This takes `root` instead of `&mut self` so that callers can mutate | ||
/// other fields while the returned borrow is still valid | ||||
Simon Sapin
|
r47874 | fn get_node_mut<'tree>( | ||
Simon Sapin
|
r48127 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48481 | unreachable_bytes: &mut u32, | ||
Simon Sapin
|
r47895 | root: &'tree mut ChildNodes<'on_disk>, | ||
Simon Sapin
|
r47874 | path: &HgPath, | ||
Simon Sapin
|
r48126 | ) -> Result<Option<&'tree mut Node<'on_disk>>, DirstateV2ParseError> { | ||
Simon Sapin
|
r47874 | let mut children = root; | ||
let mut components = path.components(); | ||||
let mut component = | ||||
components.next().expect("expected at least one components"); | ||||
loop { | ||||
Simon Sapin
|
r48481 | if let Some(child) = children | ||
.make_mut(on_disk, unreachable_bytes)? | ||||
.get_mut(component) | ||||
Simon Sapin
|
r48127 | { | ||
Simon Sapin
|
r48126 | if let Some(next_component) = components.next() { | ||
component = next_component; | ||||
children = &mut child.children; | ||||
} else { | ||||
return Ok(Some(child)); | ||||
} | ||||
Simon Sapin
|
r47874 | } else { | ||
Simon Sapin
|
r48126 | return Ok(None); | ||
Simon Sapin
|
r47874 | } | ||
} | ||||
} | ||||
Simon Sapin
|
r48268 | pub(super) fn get_or_insert<'tree, 'path>( | ||
&'tree mut self, | ||||
path: &HgPath, | ||||
) -> Result<&'tree mut Node<'on_disk>, DirstateV2ParseError> { | ||||
Self::get_or_insert_node( | ||||
self.on_disk, | ||||
Simon Sapin
|
r48481 | &mut self.unreachable_bytes, | ||
Simon Sapin
|
r48268 | &mut self.root, | ||
path, | ||||
WithBasename::to_cow_owned, | ||||
|_| {}, | ||||
) | ||||
} | ||||
Simon Sapin
|
r48481 | fn get_or_insert_node<'tree, 'path>( | ||
Simon Sapin
|
r48127 | on_disk: &'on_disk [u8], | ||
Simon Sapin
|
r48481 | unreachable_bytes: &mut u32, | ||
Simon Sapin
|
r47895 | root: &'tree mut ChildNodes<'on_disk>, | ||
Simon Sapin
|
r47896 | path: &'path HgPath, | ||
to_cow: impl Fn( | ||||
WithBasename<&'path HgPath>, | ||||
) -> WithBasename<Cow<'on_disk, HgPath>>, | ||||
Simon Sapin
|
r47890 | mut each_ancestor: impl FnMut(&mut Node), | ||
Simon Sapin
|
r48126 | ) -> Result<&'tree mut Node<'on_disk>, DirstateV2ParseError> { | ||
Simon Sapin
|
r47873 | let mut child_nodes = root; | ||
Simon Sapin
|
r47867 | let mut inclusive_ancestor_paths = | ||
WithBasename::inclusive_ancestors_of(path); | ||||
let mut ancestor_path = inclusive_ancestor_paths | ||||
.next() | ||||
.expect("expected at least one inclusive ancestor"); | ||||
loop { | ||||
Simon Sapin
|
r47886 | // TODO: can we avoid allocating an owned key in cases where the | ||
// map already contains that key, without introducing double | ||||
// lookup? | ||||
Simon Sapin
|
r48124 | let child_node = child_nodes | ||
Simon Sapin
|
r48481 | .make_mut(on_disk, unreachable_bytes)? | ||
Simon Sapin
|
r48124 | .entry(to_cow(ancestor_path)) | ||
.or_default(); | ||||
Simon Sapin
|
r47867 | if let Some(next) = inclusive_ancestor_paths.next() { | ||
Simon Sapin
|
r47890 | each_ancestor(child_node); | ||
Simon Sapin
|
r47867 | ancestor_path = next; | ||
child_nodes = &mut child_node.children; | ||||
} else { | ||||
Simon Sapin
|
r48126 | return Ok(child_node); | ||
Simon Sapin
|
r47867 | } | ||
} | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r47870 | |||
Simon Sapin
|
r47890 | fn add_or_remove_file( | ||
Simon Sapin
|
r47873 | &mut self, | ||
path: &HgPath, | ||||
Simon Sapin
|
r47890 | old_state: EntryState, | ||
Simon Sapin
|
r47873 | new_entry: DirstateEntry, | ||
Simon Sapin
|
r48126 | ) -> Result<(), DirstateV2ParseError> { | ||
Simon Sapin
|
r48272 | let had_entry = old_state != EntryState::Unknown; | ||
Simon Sapin
|
r47876 | let tracked_count_increment = | ||
Simon Sapin
|
r47890 | match (old_state.is_tracked(), new_entry.state.is_tracked()) { | ||
Simon Sapin
|
r47876 | (false, true) => 1, | ||
(true, false) => -1, | ||||
_ => 0, | ||||
}; | ||||
Simon Sapin
|
r47896 | let node = Self::get_or_insert_node( | ||
Simon Sapin
|
r48127 | self.on_disk, | ||
Simon Sapin
|
r48481 | &mut self.unreachable_bytes, | ||
Simon Sapin
|
r47890 | &mut self.root, | ||
path, | ||||
Simon Sapin
|
r47896 | WithBasename::to_cow_owned, | ||
Simon Sapin
|
r47890 | |ancestor| { | ||
Simon Sapin
|
r48272 | if !had_entry { | ||
ancestor.descendants_with_entry_count += 1; | ||||
} | ||||
Simon Sapin
|
r47890 | // We can’t use `+= increment` because the counter is unsigned, | ||
// and we want debug builds to detect accidental underflow | ||||
// through zero | ||||
match tracked_count_increment { | ||||
1 => ancestor.tracked_descendants_count += 1, | ||||
-1 => ancestor.tracked_descendants_count -= 1, | ||||
_ => {} | ||||
} | ||||
}, | ||||
Simon Sapin
|
r48126 | )?; | ||
Simon Sapin
|
r48272 | if !had_entry { | ||
Simon Sapin
|
r47890 | self.nodes_with_entry_count += 1 | ||
Simon Sapin
|
r47873 | } | ||
Simon Sapin
|
r48137 | node.data = NodeData::Entry(new_entry); | ||
Simon Sapin
|
r48126 | Ok(()) | ||
Simon Sapin
|
r47873 | } | ||
Simon Sapin
|
r48124 | fn iter_nodes<'tree>( | ||
&'tree self, | ||||
Simon Sapin
|
r48126 | ) -> impl Iterator< | ||
Item = Result<NodeRef<'tree, 'on_disk>, DirstateV2ParseError>, | ||||
> + 'tree { | ||||
Simon Sapin
|
r47870 | // Depth first tree traversal. | ||
// | ||||
// If we could afford internal iteration and recursion, | ||||
// this would look like: | ||||
// | ||||
// ``` | ||||
// fn traverse_children( | ||||
// children: &ChildNodes, | ||||
// each: &mut impl FnMut(&Node), | ||||
// ) { | ||||
// for child in children.values() { | ||||
// traverse_children(&child.children, each); | ||||
// each(child); | ||||
// } | ||||
// } | ||||
// ``` | ||||
// | ||||
// However we want an external iterator and therefore can’t use the | ||||
// call stack. Use an explicit stack instead: | ||||
let mut stack = Vec::new(); | ||||
Simon Sapin
|
r48124 | let mut iter = self.root.as_ref().iter(); | ||
Simon Sapin
|
r47870 | std::iter::from_fn(move || { | ||
Simon Sapin
|
r48124 | while let Some(child_node) = iter.next() { | ||
Simon Sapin
|
r48127 | let children = match child_node.children(self.on_disk) { | ||
Simon Sapin
|
r48126 | Ok(children) => children, | ||
Err(error) => return Some(Err(error)), | ||||
}; | ||||
Simon Sapin
|
r47870 | // Pseudo-recursion | ||
Simon Sapin
|
r48126 | let new_iter = children.iter(); | ||
Simon Sapin
|
r47870 | let old_iter = std::mem::replace(&mut iter, new_iter); | ||
Simon Sapin
|
r48124 | stack.push((child_node, old_iter)); | ||
Simon Sapin
|
r47870 | } | ||
// Found the end of a `children.iter()` iterator. | ||||
Simon Sapin
|
r48124 | if let Some((child_node, next_iter)) = stack.pop() { | ||
Simon Sapin
|
r47870 | // "Return" from pseudo-recursion by restoring state from the | ||
// explicit stack | ||||
iter = next_iter; | ||||
Simon Sapin
|
r48126 | Some(Ok(child_node)) | ||
Simon Sapin
|
r47870 | } else { | ||
// Reached the bottom of the stack, we’re done | ||||
None | ||||
} | ||||
}) | ||||
} | ||||
Simon Sapin
|
r48126 | fn clear_known_ambiguous_mtimes( | ||
&mut self, | ||||
paths: &[impl AsRef<HgPath>], | ||||
) -> Result<(), DirstateV2ParseError> { | ||||
Simon Sapin
|
r48121 | for path in paths { | ||
Simon Sapin
|
r48127 | if let Some(node) = Self::get_node_mut( | ||
self.on_disk, | ||||
Simon Sapin
|
r48481 | &mut self.unreachable_bytes, | ||
Simon Sapin
|
r48127 | &mut self.root, | ||
path.as_ref(), | ||||
)? { | ||||
Simon Sapin
|
r48137 | if let NodeData::Entry(entry) = &mut node.data { | ||
Simon Sapin
|
r48121 | entry.clear_mtime(); | ||
} | ||||
Simon Sapin
|
r47870 | } | ||
Simon Sapin
|
r48121 | } | ||
Simon Sapin
|
r48126 | Ok(()) | ||
Simon Sapin
|
r47870 | } | ||
Simon Sapin
|
r48126 | |||
/// Return a faillilble iterator of full paths of nodes that have an | ||||
/// `entry` for which the given `predicate` returns true. | ||||
/// | ||||
/// Fallibility means that each iterator item is a `Result`, which may | ||||
/// indicate a parse error of the on-disk dirstate-v2 format. Such errors | ||||
/// should only happen if Mercurial is buggy or a repository is corrupted. | ||||
fn filter_full_paths<'tree>( | ||||
&'tree self, | ||||
predicate: impl Fn(&DirstateEntry) -> bool + 'tree, | ||||
) -> impl Iterator<Item = Result<&HgPath, DirstateV2ParseError>> + 'tree | ||||
{ | ||||
filter_map_results(self.iter_nodes(), move |node| { | ||||
if let Some(entry) = node.entry()? { | ||||
if predicate(&entry) { | ||||
Simon Sapin
|
r48127 | return Ok(Some(node.full_path(self.on_disk)?)); | ||
Simon Sapin
|
r48126 | } | ||
} | ||||
Ok(None) | ||||
}) | ||||
} | ||||
Simon Sapin
|
r48481 | |||
fn count_dropped_path(unreachable_bytes: &mut u32, path: &Cow<HgPath>) { | ||||
if let Cow::Borrowed(path) = path { | ||||
*unreachable_bytes += path.len() as u32 | ||||
} | ||||
} | ||||
Simon Sapin
|
r48126 | } | ||
/// Like `Iterator::filter_map`, but over a fallible iterator of `Result`s. | ||||
/// | ||||
/// The callback is only called for incoming `Ok` values. Errors are passed | ||||
/// through as-is. In order to let it use the `?` operator the callback is | ||||
/// expected to return a `Result` of `Option`, instead of an `Option` of | ||||
/// `Result`. | ||||
fn filter_map_results<'a, I, F, A, B, E>( | ||||
iter: I, | ||||
f: F, | ||||
) -> impl Iterator<Item = Result<B, E>> + 'a | ||||
where | ||||
I: Iterator<Item = Result<A, E>> + 'a, | ||||
F: Fn(A) -> Result<Option<B>, E> + 'a, | ||||
{ | ||||
iter.filter_map(move |result| match result { | ||||
Ok(node) => f(node).transpose(), | ||||
Err(e) => Some(Err(e)), | ||||
}) | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r47893 | impl<'on_disk> super::dispatch::DirstateMapMethods for DirstateMap<'on_disk> { | ||
Simon Sapin
|
r47865 | fn clear(&mut self) { | ||
Simon Sapin
|
r48124 | self.root = Default::default(); | ||
Simon Sapin
|
r47873 | self.nodes_with_entry_count = 0; | ||
self.nodes_with_copy_source_count = 0; | ||||
Simon Sapin
|
r47865 | } | ||
r48492 | fn set_v1(&mut self, filename: &HgPath, entry: DirstateEntry) { | |||
let node = | ||||
self.get_or_insert(&filename).expect("no parse error in v1"); | ||||
node.data = NodeData::Entry(entry); | ||||
node.children = ChildNodes::default(); | ||||
node.copy_source = None; | ||||
node.descendants_with_entry_count = 0; | ||||
node.tracked_descendants_count = 0; | ||||
} | ||||
Simon Sapin
|
r47865 | fn add_file( | ||
&mut self, | ||||
Simon Sapin
|
r47877 | filename: &HgPath, | ||
entry: DirstateEntry, | ||||
r48314 | added: bool, | |||
r48316 | merged: bool, | |||
r48310 | from_p2: bool, | |||
possibly_dirty: bool, | ||||
Simon Sapin
|
r48126 | ) -> Result<(), DirstateError> { | ||
r48310 | let mut entry = entry; | |||
r48314 | if added { | |||
r48310 | assert!(!possibly_dirty); | |||
assert!(!from_p2); | ||||
r48314 | entry.state = EntryState::Added; | |||
r48310 | entry.size = SIZE_NON_NORMAL; | |||
entry.mtime = MTIME_UNSET; | ||||
r48316 | } else if merged { | |||
assert!(!possibly_dirty); | ||||
assert!(!from_p2); | ||||
entry.state = EntryState::Merged; | ||||
entry.size = SIZE_FROM_OTHER_PARENT; | ||||
entry.mtime = MTIME_UNSET; | ||||
r48310 | } else if from_p2 { | |||
assert!(!possibly_dirty); | ||||
r48318 | entry.state = EntryState::Normal; | |||
r48310 | entry.size = SIZE_FROM_OTHER_PARENT; | |||
entry.mtime = MTIME_UNSET; | ||||
} else if possibly_dirty { | ||||
r48317 | entry.state = EntryState::Normal; | |||
r48310 | entry.size = SIZE_NON_NORMAL; | |||
entry.mtime = MTIME_UNSET; | ||||
} else { | ||||
r48319 | entry.state = EntryState::Normal; | |||
r48310 | entry.size = entry.size & V1_RANGEMASK; | |||
entry.mtime = entry.mtime & V1_RANGEMASK; | ||||
} | ||||
r48313 | let old_state = match self.get(filename)? { | |||
Some(e) => e.state, | ||||
None => EntryState::Unknown, | ||||
}; | ||||
Simon Sapin
|
r48126 | Ok(self.add_or_remove_file(filename, old_state, entry)?) | ||
Simon Sapin
|
r47865 | } | ||
fn remove_file( | ||||
&mut self, | ||||
Simon Sapin
|
r47877 | filename: &HgPath, | ||
r48300 | in_merge: bool, | |||
Simon Sapin
|
r48126 | ) -> Result<(), DirstateError> { | ||
r48300 | let old_entry_opt = self.get(filename)?; | |||
let old_state = match old_entry_opt { | ||||
Some(e) => e.state, | ||||
None => EntryState::Unknown, | ||||
}; | ||||
let mut size = 0; | ||||
if in_merge { | ||||
// XXX we should not be able to have 'm' state and 'FROM_P2' if not | ||||
// during a merge. So I (marmoute) am not sure we need the | ||||
// conditionnal at all. Adding double checking this with assert | ||||
// would be nice. | ||||
if let Some(old_entry) = old_entry_opt { | ||||
// backup the previous state | ||||
if old_entry.state == EntryState::Merged { | ||||
size = SIZE_NON_NORMAL; | ||||
} else if old_entry.state == EntryState::Normal | ||||
&& old_entry.size == SIZE_FROM_OTHER_PARENT | ||||
{ | ||||
// other parent | ||||
size = SIZE_FROM_OTHER_PARENT; | ||||
} | ||||
} | ||||
} | ||||
if size == 0 { | ||||
self.copy_map_remove(filename)?; | ||||
} | ||||
Simon Sapin
|
r47877 | let entry = DirstateEntry { | ||
state: EntryState::Removed, | ||||
mode: 0, | ||||
size, | ||||
mtime: 0, | ||||
}; | ||||
Simon Sapin
|
r48126 | Ok(self.add_or_remove_file(filename, old_state, entry)?) | ||
Simon Sapin
|
r47865 | } | ||
r48324 | fn drop_file(&mut self, filename: &HgPath) -> Result<bool, DirstateError> { | |||
let old_state = match self.get(filename)? { | ||||
Some(e) => e.state, | ||||
None => EntryState::Unknown, | ||||
}; | ||||
Simon Sapin
|
r47963 | struct Dropped { | ||
was_tracked: bool, | ||||
had_entry: bool, | ||||
had_copy_source: bool, | ||||
} | ||||
Simon Sapin
|
r48141 | |||
/// If this returns `Ok(Some((dropped, removed)))`, then | ||||
/// | ||||
/// * `dropped` is about the leaf node that was at `filename` | ||||
/// * `removed` is whether this particular level of recursion just | ||||
/// removed a node in `nodes`. | ||||
Simon Sapin
|
r48127 | fn recur<'on_disk>( | ||
on_disk: &'on_disk [u8], | ||||
Simon Sapin
|
r48481 | unreachable_bytes: &mut u32, | ||
Simon Sapin
|
r48127 | nodes: &mut ChildNodes<'on_disk>, | ||
Simon Sapin
|
r48126 | path: &HgPath, | ||
Simon Sapin
|
r48141 | ) -> Result<Option<(Dropped, bool)>, DirstateV2ParseError> { | ||
Simon Sapin
|
r47963 | let (first_path_component, rest_of_path) = | ||
path.split_first_component(); | ||||
Simon Sapin
|
r48481 | let nodes = nodes.make_mut(on_disk, unreachable_bytes)?; | ||
let node = if let Some(node) = nodes.get_mut(first_path_component) | ||||
Simon Sapin
|
r48126 | { | ||
node | ||||
} else { | ||||
return Ok(None); | ||||
}; | ||||
Simon Sapin
|
r47963 | let dropped; | ||
if let Some(rest) = rest_of_path { | ||||
Simon Sapin
|
r48481 | if let Some((d, removed)) = recur( | ||
on_disk, | ||||
unreachable_bytes, | ||||
&mut node.children, | ||||
rest, | ||||
)? { | ||||
Simon Sapin
|
r48126 | dropped = d; | ||
Simon Sapin
|
r48272 | if dropped.had_entry { | ||
node.descendants_with_entry_count -= 1; | ||||
} | ||||
Simon Sapin
|
r48126 | if dropped.was_tracked { | ||
node.tracked_descendants_count -= 1; | ||||
} | ||||
Simon Sapin
|
r48141 | |||
// Directory caches must be invalidated when removing a | ||||
// child node | ||||
if removed { | ||||
if let NodeData::CachedDirectory { .. } = &node.data { | ||||
node.data = NodeData::None | ||||
} | ||||
} | ||||
Simon Sapin
|
r48126 | } else { | ||
return Ok(None); | ||||
Simon Sapin
|
r47890 | } | ||
Simon Sapin
|
r47963 | } else { | ||
Simon Sapin
|
r48137 | let had_entry = node.data.has_entry(); | ||
if had_entry { | ||||
node.data = NodeData::None | ||||
} | ||||
Simon Sapin
|
r48481 | if let Some(source) = &node.copy_source { | ||
DirstateMap::count_dropped_path(unreachable_bytes, source) | ||||
} | ||||
Simon Sapin
|
r47963 | dropped = Dropped { | ||
was_tracked: node | ||||
Simon Sapin
|
r48137 | .data | ||
.as_entry() | ||||
Simon Sapin
|
r47963 | .map_or(false, |entry| entry.state.is_tracked()), | ||
Simon Sapin
|
r48137 | had_entry, | ||
Simon Sapin
|
r47963 | had_copy_source: node.copy_source.take().is_some(), | ||
}; | ||||
Simon Sapin
|
r47964 | } | ||
// After recursion, for both leaf (rest_of_path is None) nodes and | ||||
// parent nodes, remove a node if it just became empty. | ||||
Simon Sapin
|
r48141 | let remove = !node.data.has_entry() | ||
Simon Sapin
|
r47964 | && node.copy_source.is_none() | ||
Simon Sapin
|
r48141 | && node.children.is_empty(); | ||
if remove { | ||||
Simon Sapin
|
r48481 | let (key, _) = | ||
nodes.remove_entry(first_path_component).unwrap(); | ||||
DirstateMap::count_dropped_path( | ||||
unreachable_bytes, | ||||
key.full_path(), | ||||
) | ||||
Simon Sapin
|
r47963 | } | ||
Simon Sapin
|
r48141 | Ok(Some((dropped, remove))) | ||
Simon Sapin
|
r47963 | } | ||
Simon Sapin
|
r47877 | |||
Simon Sapin
|
r48481 | if let Some((dropped, _removed)) = recur( | ||
self.on_disk, | ||||
&mut self.unreachable_bytes, | ||||
&mut self.root, | ||||
filename, | ||||
)? { | ||||
Simon Sapin
|
r47963 | if dropped.had_entry { | ||
Simon Sapin
|
r47877 | self.nodes_with_entry_count -= 1 | ||
} | ||||
Simon Sapin
|
r47963 | if dropped.had_copy_source { | ||
Simon Sapin
|
r47877 | self.nodes_with_copy_source_count -= 1 | ||
} | ||||
Simon Sapin
|
r47963 | Ok(dropped.had_entry) | ||
Simon Sapin
|
r47877 | } else { | ||
Simon Sapin
|
r47963 | debug_assert!(!old_state.is_tracked()); | ||
Simon Sapin
|
r47877 | Ok(false) | ||
} | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn clear_ambiguous_times( | ||
&mut self, | ||||
filenames: Vec<HgPathBuf>, | ||||
now: i32, | ||||
) -> Result<(), DirstateV2ParseError> { | ||||
Simon Sapin
|
r47875 | for filename in filenames { | ||
Simon Sapin
|
r48481 | if let Some(node) = Self::get_node_mut( | ||
self.on_disk, | ||||
&mut self.unreachable_bytes, | ||||
&mut self.root, | ||||
&filename, | ||||
)? { | ||||
Simon Sapin
|
r48137 | if let NodeData::Entry(entry) = &mut node.data { | ||
Simon Sapin
|
r48121 | entry.clear_ambiguous_mtime(now); | ||
Simon Sapin
|
r47875 | } | ||
} | ||||
} | ||||
Simon Sapin
|
r48126 | Ok(()) | ||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn non_normal_entries_contains( | ||
&mut self, | ||||
key: &HgPath, | ||||
) -> Result<bool, DirstateV2ParseError> { | ||||
Ok(if let Some(node) = self.get_node(key)? { | ||||
node.entry()?.map_or(false, |entry| entry.is_non_normal()) | ||||
} else { | ||||
false | ||||
}) | ||||
Simon Sapin
|
r47865 | } | ||
r48492 | fn non_normal_entries_remove(&mut self, key: &HgPath) -> bool { | |||
// Do nothing, this `DirstateMap` does not have a separate "non normal | ||||
// entries" set that need to be kept up to date. | ||||
if let Ok(Some(v)) = self.get(key) { | ||||
return v.is_non_normal(); | ||||
} | ||||
false | ||||
} | ||||
fn non_normal_entries_add(&mut self, _key: &HgPath) { | ||||
Simon Sapin
|
r47878 | // Do nothing, this `DirstateMap` does not have a separate "non normal | ||
// entries" set that need to be kept up to date | ||||
Simon Sapin
|
r47865 | } | ||
fn non_normal_or_other_parent_paths( | ||||
&mut self, | ||||
Simon Sapin
|
r48126 | ) -> Box<dyn Iterator<Item = Result<&HgPath, DirstateV2ParseError>> + '_> | ||
{ | ||||
Box::new(self.filter_full_paths(|entry| { | ||||
entry.is_non_normal() || entry.is_from_other_parent() | ||||
Simon Sapin
|
r47878 | })) | ||
Simon Sapin
|
r47865 | } | ||
fn set_non_normal_other_parent_entries(&mut self, _force: bool) { | ||||
Simon Sapin
|
r47878 | // Do nothing, this `DirstateMap` does not have a separate "non normal | ||
// entries" and "from other parent" sets that need to be recomputed | ||||
Simon Sapin
|
r47865 | } | ||
fn iter_non_normal_paths( | ||||
&mut self, | ||||
Simon Sapin
|
r48126 | ) -> Box< | ||
dyn Iterator<Item = Result<&HgPath, DirstateV2ParseError>> + Send + '_, | ||||
> { | ||||
Simon Sapin
|
r47878 | self.iter_non_normal_paths_panic() | ||
Simon Sapin
|
r47865 | } | ||
fn iter_non_normal_paths_panic( | ||||
&self, | ||||
Simon Sapin
|
r48126 | ) -> Box< | ||
dyn Iterator<Item = Result<&HgPath, DirstateV2ParseError>> + Send + '_, | ||||
> { | ||||
Box::new(self.filter_full_paths(|entry| entry.is_non_normal())) | ||||
Simon Sapin
|
r47865 | } | ||
fn iter_other_parent_paths( | ||||
&mut self, | ||||
Simon Sapin
|
r48126 | ) -> Box< | ||
dyn Iterator<Item = Result<&HgPath, DirstateV2ParseError>> + Send + '_, | ||||
> { | ||||
Box::new(self.filter_full_paths(|entry| entry.is_from_other_parent())) | ||||
Simon Sapin
|
r47865 | } | ||
fn has_tracked_dir( | ||||
&mut self, | ||||
Simon Sapin
|
r47876 | directory: &HgPath, | ||
Simon Sapin
|
r48126 | ) -> Result<bool, DirstateError> { | ||
if let Some(node) = self.get_node(directory)? { | ||||
Simon Sapin
|
r47876 | // A node without a `DirstateEntry` was created to hold child | ||
// nodes, and is therefore a directory. | ||||
Simon Sapin
|
r48137 | let state = node.state()?; | ||
Ok(state.is_none() && node.tracked_descendants_count() > 0) | ||||
Simon Sapin
|
r47876 | } else { | ||
Ok(false) | ||||
} | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn has_dir(&mut self, directory: &HgPath) -> Result<bool, DirstateError> { | ||
if let Some(node) = self.get_node(directory)? { | ||||
Simon Sapin
|
r47876 | // A node without a `DirstateEntry` was created to hold child | ||
// nodes, and is therefore a directory. | ||||
Simon Sapin
|
r48272 | let state = node.state()?; | ||
Ok(state.is_none() && node.descendants_with_entry_count() > 0) | ||||
Simon Sapin
|
r47876 | } else { | ||
Ok(false) | ||||
} | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48055 | #[timed] | ||
fn pack_v1( | ||||
Simon Sapin
|
r47865 | &mut self, | ||
Simon Sapin
|
r47872 | parents: DirstateParents, | ||
now: Timestamp, | ||||
Simon Sapin
|
r47865 | ) -> Result<Vec<u8>, DirstateError> { | ||
Simon Sapin
|
r48121 | let now: i32 = now.0.try_into().expect("time overflow"); | ||
let mut ambiguous_mtimes = Vec::new(); | ||||
Simon Sapin
|
r47872 | // Optizimation (to be measured?): pre-compute size to avoid `Vec` | ||
// reallocations | ||||
let mut size = parents.as_bytes().len(); | ||||
Simon Sapin
|
r48124 | for node in self.iter_nodes() { | ||
Simon Sapin
|
r48126 | let node = node?; | ||
if let Some(entry) = node.entry()? { | ||||
Simon Sapin
|
r48127 | size += packed_entry_size( | ||
node.full_path(self.on_disk)?, | ||||
node.copy_source(self.on_disk)?, | ||||
); | ||||
Simon Sapin
|
r48121 | if entry.mtime_is_ambiguous(now) { | ||
Simon Sapin
|
r48136 | ambiguous_mtimes.push( | ||
node.full_path_borrowed(self.on_disk)? | ||||
.detach_from_tree(), | ||||
) | ||||
Simon Sapin
|
r48121 | } | ||
Simon Sapin
|
r47872 | } | ||
} | ||||
Simon Sapin
|
r48126 | self.clear_known_ambiguous_mtimes(&ambiguous_mtimes)?; | ||
Simon Sapin
|
r47872 | |||
let mut packed = Vec::with_capacity(size); | ||||
packed.extend(parents.as_bytes()); | ||||
Simon Sapin
|
r48124 | for node in self.iter_nodes() { | ||
Simon Sapin
|
r48126 | let node = node?; | ||
if let Some(entry) = node.entry()? { | ||||
Simon Sapin
|
r47872 | pack_entry( | ||
Simon Sapin
|
r48127 | node.full_path(self.on_disk)?, | ||
Simon Sapin
|
r48124 | &entry, | ||
Simon Sapin
|
r48127 | node.copy_source(self.on_disk)?, | ||
Simon Sapin
|
r47872 | &mut packed, | ||
); | ||||
} | ||||
} | ||||
Ok(packed) | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48482 | /// Returns new data and metadata together with whether that data should be | ||
/// appended to the existing data file whose content is at | ||||
/// `self.on_disk` (true), instead of written to a new data file | ||||
/// (false). | ||||
Simon Sapin
|
r48055 | #[timed] | ||
Simon Sapin
|
r48478 | fn pack_v2( | ||
&mut self, | ||||
now: Timestamp, | ||||
can_append: bool, | ||||
Simon Sapin
|
r48482 | ) -> Result<(Vec<u8>, Vec<u8>, bool), DirstateError> { | ||
Simon Sapin
|
r48121 | // TODO:Â how do we want to handle this in 2038? | ||
let now: i32 = now.0.try_into().expect("time overflow"); | ||||
let mut paths = Vec::new(); | ||||
Simon Sapin
|
r48124 | for node in self.iter_nodes() { | ||
Simon Sapin
|
r48126 | let node = node?; | ||
if let Some(entry) = node.entry()? { | ||||
Simon Sapin
|
r48121 | if entry.mtime_is_ambiguous(now) { | ||
Simon Sapin
|
r48136 | paths.push( | ||
node.full_path_borrowed(self.on_disk)? | ||||
.detach_from_tree(), | ||||
) | ||||
Simon Sapin
|
r48121 | } | ||
} | ||||
} | ||||
// Borrow of `self` ends here since we collect cloned paths | ||||
Simon Sapin
|
r48126 | self.clear_known_ambiguous_mtimes(&paths)?; | ||
Simon Sapin
|
r48121 | |||
Simon Sapin
|
r48478 | on_disk::write(self, can_append) | ||
Simon Sapin
|
r48055 | } | ||
Simon Sapin
|
r47865 | fn status<'a>( | ||
Simon Sapin
|
r47882 | &'a mut self, | ||
matcher: &'a (dyn Matcher + Sync), | ||||
root_dir: PathBuf, | ||||
ignore_files: Vec<PathBuf>, | ||||
options: StatusOptions, | ||||
Simon Sapin
|
r47880 | ) -> Result<(DirstateStatus<'a>, Vec<PatternFileWarning>), StatusError> | ||
{ | ||||
Simon Sapin
|
r47882 | super::status::status(self, matcher, root_dir, ignore_files, options) | ||
Simon Sapin
|
r47865 | } | ||
fn copy_map_len(&self) -> usize { | ||||
Simon Sapin
|
r48058 | self.nodes_with_copy_source_count as usize | ||
Simon Sapin
|
r47865 | } | ||
fn copy_map_iter(&self) -> CopyMapIter<'_> { | ||||
Simon Sapin
|
r48127 | Box::new(filter_map_results(self.iter_nodes(), move |node| { | ||
Ok(if let Some(source) = node.copy_source(self.on_disk)? { | ||||
Some((node.full_path(self.on_disk)?, source)) | ||||
Simon Sapin
|
r48126 | } else { | ||
None | ||||
}) | ||||
Simon Sapin
|
r47870 | })) | ||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn copy_map_contains_key( | ||
&self, | ||||
key: &HgPath, | ||||
) -> Result<bool, DirstateV2ParseError> { | ||||
Ok(if let Some(node) = self.get_node(key)? { | ||||
node.has_copy_source() | ||||
Simon Sapin
|
r47869 | } else { | ||
false | ||||
Simon Sapin
|
r48126 | }) | ||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn copy_map_get( | ||
&self, | ||||
key: &HgPath, | ||||
) -> Result<Option<&HgPath>, DirstateV2ParseError> { | ||||
if let Some(node) = self.get_node(key)? { | ||||
Simon Sapin
|
r48127 | if let Some(source) = node.copy_source(self.on_disk)? { | ||
Simon Sapin
|
r48126 | return Ok(Some(source)); | ||
} | ||||
} | ||||
Ok(None) | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn copy_map_remove( | ||
&mut self, | ||||
key: &HgPath, | ||||
) -> Result<Option<HgPathBuf>, DirstateV2ParseError> { | ||||
Simon Sapin
|
r47874 | let count = &mut self.nodes_with_copy_source_count; | ||
Simon Sapin
|
r48481 | let unreachable_bytes = &mut self.unreachable_bytes; | ||
Ok(Self::get_node_mut( | ||||
self.on_disk, | ||||
unreachable_bytes, | ||||
&mut self.root, | ||||
key, | ||||
)? | ||||
.and_then(|node| { | ||||
if let Some(source) = &node.copy_source { | ||||
*count -= 1; | ||||
Self::count_dropped_path(unreachable_bytes, source); | ||||
} | ||||
node.copy_source.take().map(Cow::into_owned) | ||||
})) | ||||
Simon Sapin
|
r47865 | } | ||
fn copy_map_insert( | ||||
&mut self, | ||||
Simon Sapin
|
r47874 | key: HgPathBuf, | ||
value: HgPathBuf, | ||||
Simon Sapin
|
r48126 | ) -> Result<Option<HgPathBuf>, DirstateV2ParseError> { | ||
Simon Sapin
|
r47896 | let node = Self::get_or_insert_node( | ||
Simon Sapin
|
r48127 | self.on_disk, | ||
Simon Sapin
|
r48481 | &mut self.unreachable_bytes, | ||
Simon Sapin
|
r47896 | &mut self.root, | ||
&key, | ||||
WithBasename::to_cow_owned, | ||||
|_ancestor| {}, | ||||
Simon Sapin
|
r48126 | )?; | ||
Simon Sapin
|
r47874 | if node.copy_source.is_none() { | ||
self.nodes_with_copy_source_count += 1 | ||||
} | ||||
Simon Sapin
|
r48126 | Ok(node.copy_source.replace(value.into()).map(Cow::into_owned)) | ||
Simon Sapin
|
r47865 | } | ||
fn len(&self) -> usize { | ||||
Simon Sapin
|
r48058 | self.nodes_with_entry_count as usize | ||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn contains_key( | ||
&self, | ||||
key: &HgPath, | ||||
) -> Result<bool, DirstateV2ParseError> { | ||||
Ok(self.get(key)?.is_some()) | ||||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48126 | fn get( | ||
&self, | ||||
key: &HgPath, | ||||
) -> Result<Option<DirstateEntry>, DirstateV2ParseError> { | ||||
Ok(if let Some(node) = self.get_node(key)? { | ||||
node.entry()? | ||||
} else { | ||||
None | ||||
}) | ||||
Simon Sapin
|
r47865 | } | ||
fn iter(&self) -> StateMapIter<'_> { | ||||
Simon Sapin
|
r48127 | Box::new(filter_map_results(self.iter_nodes(), move |node| { | ||
Simon Sapin
|
r48126 | Ok(if let Some(entry) = node.entry()? { | ||
Simon Sapin
|
r48127 | Some((node.full_path(self.on_disk)?, entry)) | ||
Simon Sapin
|
r48126 | } else { | ||
None | ||||
}) | ||||
Simon Sapin
|
r47870 | })) | ||
Simon Sapin
|
r47865 | } | ||
Simon Sapin
|
r48140 | |||
Simon Sapin
|
r48483 | fn iter_tracked_dirs( | ||
&mut self, | ||||
) -> Result< | ||||
Box< | ||||
dyn Iterator<Item = Result<&HgPath, DirstateV2ParseError>> | ||||
+ Send | ||||
+ '_, | ||||
>, | ||||
DirstateError, | ||||
> { | ||||
let on_disk = self.on_disk; | ||||
Ok(Box::new(filter_map_results( | ||||
self.iter_nodes(), | ||||
move |node| { | ||||
Ok(if node.tracked_descendants_count() > 0 { | ||||
Some(node.full_path(on_disk)?) | ||||
} else { | ||||
None | ||||
}) | ||||
}, | ||||
))) | ||||
} | ||||
fn debug_iter( | ||||
Simon Sapin
|
r48140 | &self, | ||
) -> Box< | ||||
dyn Iterator< | ||||
Item = Result< | ||||
Simon Sapin
|
r48483 | (&HgPath, (u8, i32, i32, i32)), | ||
Simon Sapin
|
r48140 | DirstateV2ParseError, | ||
>, | ||||
> + Send | ||||
+ '_, | ||||
> { | ||||
Simon Sapin
|
r48483 | Box::new(self.iter_nodes().map(move |node| { | ||
let node = node?; | ||||
let debug_tuple = if let Some(entry) = node.entry()? { | ||||
entry.debug_tuple() | ||||
} else if let Some(mtime) = node.cached_directory_mtime() { | ||||
(b' ', 0, -1, mtime.seconds() as i32) | ||||
Simon Sapin
|
r48140 | } else { | ||
Simon Sapin
|
r48483 | (b' ', 0, -1, -1) | ||
}; | ||||
Ok((node.full_path(self.on_disk)?, debug_tuple)) | ||||
Simon Sapin
|
r48140 | })) | ||
} | ||||
Simon Sapin
|
r47865 | } | ||