upstream/mercurial-mirror Files · rust/hg-core/src/lib.rs

copies: do full filtering at end of _changesetforwardcopies()...

copies: do full filtering at end of _changesetforwardcopies() As mentioned earlier, pathcopies() is very slow when copies are stored in the changeset. Most of the cost comes from calling _chain() for every changeset, which is slow because it needs to read manifests. It needs to read manifests to be able to filter out copies that were created in one commit and then deleted. (It also filters out copies that were created from a file that didn't exist in the starting revision, but that's a fixed revision across calls to _chain(), so it's much cheaper.) This patch changes from _chainandfilter() to just _chain() in the main loop in _changesetforwardcopies(). It instead removes copies that have subsequently been removed by using ctx.filesremoved(). We thus rely on that to be fast. I timed this command in mozilla-unified: hg debugpathcopies FIREFOX_59_0b3_BUILD2 FIREFOX_BETA_59_END It took 18s before and 1.1s after. It's still faster when copy information is stored in filelogs: 0.70s. It also still gets slow when there are merge commits involved, because we read manifests there too. We'll deal with that later. Differential Revision: https://phab.mercurial-scm.org/D6419

Raphaël Gomès - - Load All Authors

File last commit:

r42630:9609430d default


                r42685:4c39c99d

default

Download file

             lib.rs
        
                    103 lines
            
             | 2.7 KiB
            
                | application/rls-services+xml
            
             |
                RustLexer
            
             / rust / hg-core / src / lib.rs
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      // Copyright 2018 Georges Racinet <gracinet@anybox.fr>

      //

      // This software may be used and distributed according to the terms of the

      // GNU General Public License version 2 or any later version.

      extern crate byteorder;

      extern crate memchr;

      #[macro_use]

      extern crate lazy_static;

      extern crate regex;

      mod ancestors;

      pub mod dagops;

      pub use ancestors::{AncestorsIterator, LazyAncestors, MissingAncestors};

      mod dirstate;

      pub mod discovery;

      pub mod testing; // unconditionally built, for use from integration tests

      pub use dirstate::{

          parsers::{pack_dirstate, parse_dirstate},

          CopyVec, CopyVecEntry, DirstateEntry, DirstateParents, DirstateVec,

      };

      mod filepatterns;

      mod utils;

      pub use filepatterns::{

          build_single_regex, read_pattern_file, PatternSyntax, PatternTuple,

      };

      /// Mercurial revision numbers

      ///

      /// As noted in revlog.c, revision numbers are actually encoded in

      /// 4 bytes, and are liberally converted to ints, whence the i32

      pub type Revision = i32;

      /// Marker expressing the absence of a parent

      ///

      /// Independently of the actual representation, `NULL_REVISION` is guaranteed

      /// to be smaller than all existing revisions.

      pub const NULL_REVISION: Revision = -1;

      /// Same as `mercurial.node.wdirrev`

      ///

      /// This is also equal to `i32::max_value()`, but it's better to spell

      /// it out explicitly, same as in `mercurial.node`

      pub const WORKING_DIRECTORY_REVISION: Revision = 0x7fffffff;

      /// The simplest expression of what we need of Mercurial DAGs.
      pub trait Graph {
          /// Return the two parents of the given `Revision`.
          ///
          /// Each of the parents can be independently `NULL_REVISION`.
          ///
          /// # Errors
          ///
          /// Failures are reported through `GraphError`.
          //
          // The parameter is named explicitly: anonymous trait-method
          // parameters are deprecated and rejected from the 2018 edition on.
          fn parents(&self, rev: Revision) -> Result<[Revision; 2], GraphError>;
      }

      /// Line number type; used as the second field of
      /// `PatternFileError::Pattern`.
      pub type LineNumber = usize;

      /// Error type returned by `Graph::parents`.
      #[derive(Clone, Debug, PartialEq)]

      pub enum GraphError {

          /// Carries the `Revision` involved.
          /// NOTE(review): presumably a revision outside the range known to
          /// the graph; confirm against the implementors.
          ParentOutOfRange(Revision),

          /// NOTE(review): presumably reported when
          /// `WORKING_DIRECTORY_REVISION` is encountered; confirm against
          /// the implementors.
          WorkingDirectoryUnsupported,

      }

      /// Errors related to parsing a dirstate.
      /// NOTE(review): presumably the error type of `parse_dirstate`; confirm
      /// in the `dirstate::parsers` module.
      #[derive(Clone, Debug, PartialEq)]

      pub enum DirstateParseError {

          /// NOTE(review): presumably the input is shorter than required;
          /// confirm against the parser.
          TooLittleData,

          /// NOTE(review): presumably a numeric overflow while decoding;
          /// confirm against the parser.
          Overflow,

          /// Carries a descriptive message. The `From<std::io::Error>`
          /// conversion in this file stores the I/O error's text here.
          CorruptedEntry(String),

      }

      /// Errors related to packing a dirstate.
      /// NOTE(review): presumably the error type of `pack_dirstate`; confirm
      /// in the `dirstate::parsers` module.
      #[derive(Debug, PartialEq)]

      pub enum DirstatePackError {

          /// Carries a descriptive message. The `From<std::io::Error>`
          /// conversion in this file stores the I/O error's text here.
          CorruptedEntry(String),

          /// NOTE(review): presumably an invalid parent entry; confirm
          /// against the packer.
          CorruptedParent,

          /// Carries two sizes.
          /// NOTE(review): presumably expected vs. actual size; the order is
          /// not visible here, confirm against the packer.
          BadSize(usize, usize),

      }

      impl From<std::io::Error> for DirstatePackError {

          fn from(e: std::io::Error) -> Self {

              DirstatePackError::CorruptedEntry(e.to_string())

          }

      }

      impl From<std::io::Error> for DirstateParseError {

          fn from(e: std::io::Error) -> Self {

              DirstateParseError::CorruptedEntry(e.to_string())

          }

      }

      /// Error about a single pattern; wrapped by
      /// `PatternFileError::Pattern`.
      #[derive(Debug)]

      pub enum PatternError {

          /// Carries a `String`.
          /// NOTE(review): presumably the name of the unsupported syntax;
          /// confirm in the `filepatterns` module.
          UnsupportedSyntax(String),

      }

      /// Errors related to handling a pattern file.
      /// NOTE(review): presumably the error type of `read_pattern_file`;
      /// confirm in the `filepatterns` module.
      #[derive(Debug)]

      pub enum PatternFileError {

          /// An underlying I/O error; produced by the
          /// `From<std::io::Error>` conversion in this file.
          IO(std::io::Error),

          /// A `PatternError` together with a `LineNumber`.
          /// NOTE(review): presumably the line of the offending pattern;
          /// confirm in the `filepatterns` module.
          Pattern(PatternError, LineNumber),

      }

      impl From<std::io::Error> for PatternFileError {

          fn from(e: std::io::Error) -> Self {

              PatternFileError::IO(e)

          }

      }

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				// Copyright 2018 Georges Racinet <gracinet@anybox.fr>
				//
				// This software may be used and distributed according to the terms of the
				// GNU General Public License version 2 or any later version.
				extern crate byteorder;
				extern crate memchr;
				#[macro_use]
				extern crate lazy_static;
				extern crate regex;

				mod ancestors;
				pub mod dagops;
				pub use ancestors::{AncestorsIterator, LazyAncestors, MissingAncestors};
				mod dirstate;
				pub mod discovery;
				pub mod testing; // unconditionally built, for use from integration tests
				pub use dirstate::{
				parsers::{pack_dirstate, parse_dirstate},
				CopyVec, CopyVecEntry, DirstateEntry, DirstateParents, DirstateVec,
				};
				mod filepatterns;
				mod utils;

				pub use filepatterns::{
				build_single_regex, read_pattern_file, PatternSyntax, PatternTuple,
				};

				/// Mercurial revision numbers
				///
				/// As noted in revlog.c, revision numbers are actually encoded in
				/// 4 bytes, and are liberally converted to ints, whence the i32
				pub type Revision = i32;

				/// Marker expressing the absence of a parent
				///
				/// Independently of the actual representation, `NULL_REVISION` is guaranteed
				/// to be smaller than all existing revisions.
				pub const NULL_REVISION: Revision = -1;

				/// Same as `mercurial.node.wdirrev`
				///
				/// This is also equal to `i32::max_value()`, but it's better to spell
				/// it out explicitly, same as in `mercurial.node`
				pub const WORKING_DIRECTORY_REVISION: Revision = 0x7fffffff;

				/// The simplest expression of what we need of Mercurial DAGs.
				pub trait Graph {
					/// Return the two parents of the given `Revision`.
					///
					/// Each of the parents can be independently `NULL_REVISION`.
					///
					/// # Errors
					///
					/// Failures are reported through `GraphError`.
					//
					// The parameter is named explicitly: anonymous trait-method
					// parameters are deprecated and rejected from the 2018 edition on.
					fn parents(&self, rev: Revision) -> Result<[Revision; 2], GraphError>;
				}

				/// Line number type; used as the second field of
				/// `PatternFileError::Pattern`.
				pub type LineNumber = usize;

				/// Error type returned by `Graph::parents`.
				#[derive(Clone, Debug, PartialEq)]
				pub enum GraphError {
				/// Carries the `Revision` involved.
				/// NOTE(review): presumably a revision outside the range known to
				/// the graph; confirm against the implementors.
				ParentOutOfRange(Revision),
				/// NOTE(review): presumably reported when
				/// `WORKING_DIRECTORY_REVISION` is encountered; confirm against
				/// the implementors.
				WorkingDirectoryUnsupported,
				}

				/// Errors related to parsing a dirstate.
				/// NOTE(review): presumably the error type of `parse_dirstate`; confirm
				/// in the `dirstate::parsers` module.
				#[derive(Clone, Debug, PartialEq)]
				pub enum DirstateParseError {
				/// NOTE(review): presumably the input is shorter than required;
				/// confirm against the parser.
				TooLittleData,
				/// NOTE(review): presumably a numeric overflow while decoding;
				/// confirm against the parser.
				Overflow,
				/// Carries a descriptive message. The `From<std::io::Error>`
				/// conversion in this file stores the I/O error's text here.
				CorruptedEntry(String),
				}

				/// Errors related to packing a dirstate.
				/// NOTE(review): presumably the error type of `pack_dirstate`; confirm
				/// in the `dirstate::parsers` module.
				#[derive(Debug, PartialEq)]
				pub enum DirstatePackError {
				/// Carries a descriptive message. The `From<std::io::Error>`
				/// conversion in this file stores the I/O error's text here.
				CorruptedEntry(String),
				/// NOTE(review): presumably an invalid parent entry; confirm
				/// against the packer.
				CorruptedParent,
				/// Carries two sizes.
				/// NOTE(review): presumably expected vs. actual size; the order is
				/// not visible here, confirm against the packer.
				BadSize(usize, usize),
				}

				impl From<std::io::Error> for DirstatePackError {
				fn from(e: std::io::Error) -> Self {
				DirstatePackError::CorruptedEntry(e.to_string())
				}
				}

				impl From<std::io::Error> for DirstateParseError {
				fn from(e: std::io::Error) -> Self {
				DirstateParseError::CorruptedEntry(e.to_string())
				}
				}

				/// Error about a single pattern; wrapped by
				/// `PatternFileError::Pattern`.
				#[derive(Debug)]
				pub enum PatternError {
				/// Carries a `String`.
				/// NOTE(review): presumably the name of the unsupported syntax;
				/// confirm in the `filepatterns` module.
				UnsupportedSyntax(String),
				}

				/// Errors related to handling a pattern file.
				/// NOTE(review): presumably the error type of `read_pattern_file`;
				/// confirm in the `filepatterns` module.
				#[derive(Debug)]
				pub enum PatternFileError {
				/// An underlying I/O error; produced by the
				/// `From<std::io::Error>` conversion in this file.
				IO(std::io::Error),
				/// A `PatternError` together with a `LineNumber`.
				/// NOTE(review): presumably the line of the offending pattern;
				/// confirm in the `filepatterns` module.
				Pattern(PatternError, LineNumber),
				}

				impl From<std::io::Error> for PatternFileError {
				fn from(e: std::io::Error) -> Self {
				PatternFileError::IO(e)
				}
				}