##// END OF EJS Templates
tests: pass re.MULTILINE to re.sub as 'flags' - not in 'count' position...
tests: pass re.MULTILINE to re.sub as 'flags' - not in 'count' position This bug was caught by the new Python 3.13 warning: DeprecationWarning: 'count' is passed as positional argument

File last commit:

r52756:f4733654 default
r53000:4fbee56e stable
Show More
smartset.py
1141 lines | 33.6 KiB | text/x-python | PythonLexer
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 # smartset.py - data structure for revision set
#
Raphaël Gomès
contributor: change mentions of mpm to olivia...
r47575 # Copyright 2010 Olivia Mackall <olivia@selenic.com>
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 #
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.
from . import (
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 encoding,
Yuya Nishihara
smartset: extract method to slice abstractsmartset...
r32819 error,
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 pycompat,
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 util,
)
Augie Fackler
formatting: blacken the codebase...
r43346 from .utils import stringutil
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919
def _typename(o):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 return pycompat.sysbytes(type(o).__name__).lstrip(b'_')
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Augie Fackler
formatting: blacken the codebase...
r43346
Gregory Szorc
py3: use class X: instead of class X(object):...
r49801 class abstractsmartset:
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __nonzero__(self):
"""True if the smartset is not empty"""
raise NotImplementedError()
Gregory Szorc
py3: add __bool__ to every class defining __nonzero__...
r31476 __bool__ = __nonzero__
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __contains__(self, rev):
"""provide fast membership testing"""
raise NotImplementedError()
def __iter__(self):
"""iterate the set in the order it is supposed to be iterated"""
raise NotImplementedError()
# Attributes containing a function to perform a fast iteration in a given
# direction. A smartset can have none, one, or both defined.
#
# Default value is None instead of a function returning None to avoid
# initializing an iterator just for testing if a fast method exists.
fastasc = None
fastdesc = None
def isascending(self):
"""True if the set will iterate in ascending order"""
raise NotImplementedError()
def isdescending(self):
"""True if the set will iterate in descending order"""
raise NotImplementedError()
def istopo(self):
"""True if the set will iterate in topographical order"""
raise NotImplementedError()
def min(self):
"""return the minimum element in the set"""
if self.fastasc is None:
v = min(self)
else:
for v in self.fastasc():
break
else:
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 raise ValueError(b'arg is an empty sequence')
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 self.min = lambda: v
return v
def max(self):
"""return the maximum element in the set"""
if self.fastdesc is None:
return max(self)
else:
for v in self.fastdesc():
break
else:
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 raise ValueError(b'arg is an empty sequence')
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 self.max = lambda: v
return v
def first(self):
"""return the first element in the set (user iteration perspective)
Return None if the set is empty"""
raise NotImplementedError()
def last(self):
"""return the last element in the set (user iteration perspective)
Return None if the set is empty"""
raise NotImplementedError()
def __len__(self):
"""return the length of the smartsets
This can be expensive on smartset that could be lazy otherwise."""
raise NotImplementedError()
def reverse(self):
"""reverse the expected iteration order"""
raise NotImplementedError()
Yuya Nishihara
smartset: fix default value of abstractsmartset.sort()...
r33072 def sort(self, reverse=False):
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 """get the set to iterate in an ascending or descending order"""
raise NotImplementedError()
def __and__(self, other):
"""Returns a new object with the intersection of the two collections.
This is part of the mandatory API for smartset."""
if isinstance(other, fullreposet):
return self
return self.filter(other.__contains__, condrepr=other, cache=False)
def __add__(self, other):
"""Returns a new object with the union of the two collections.
This is part of the mandatory API for smartset."""
return addset(self, other)
def __sub__(self, other):
"""Returns a new object with the substraction of the two collections.
This is part of the mandatory API for smartset."""
c = other.__contains__
Augie Fackler
formatting: blacken the codebase...
r43346 return self.filter(
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 lambda r: not c(r), condrepr=(b'<not %r>', other), cache=False
Augie Fackler
formatting: blacken the codebase...
r43346 )
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
def filter(self, condition, condrepr=None, cache=True):
"""Returns this smartset filtered by condition as a new smartset.
`condition` is a callable which takes a revision number and returns a
boolean. Optional `condrepr` provides a printable representation of
the given `condition`.
This is part of the mandatory API for smartset."""
# builtin cannot be cached. but do not needs to
safehasattr: drop usage in favor of hasattr...
r51821 if cache and hasattr(condition, '__code__'):
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 condition = util.cachefunc(condition)
return filteredset(self, condition, condrepr)
Yuya Nishihara
smartset: extract method to slice abstractsmartset...
r32819 def slice(self, start, stop):
"""Return new smartset that contains selected elements from this set"""
if start < 0 or stop < 0:
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 raise error.ProgrammingError(b'negative index not allowed')
Yuya Nishihara
smartset: extract method to slice abstractsmartset...
r32819 return self._slice(start, stop)
def _slice(self, start, stop):
# sub classes may override this. start and stop must not be negative,
# but start > stop is allowed, which should be an empty set.
ys = []
it = iter(self)
Manuel Jacob
py3: replace `pycompat.xrange` by `range`
r50179 for x in range(start):
Yuya Nishihara
smartset: extract method to slice abstractsmartset...
r32819 y = next(it, None)
if y is None:
break
Manuel Jacob
py3: replace `pycompat.xrange` by `range`
r50179 for x in range(stop - start):
Yuya Nishihara
smartset: extract method to slice abstractsmartset...
r32819 y = next(it, None)
if y is None:
break
ys.append(y)
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 return baseset(ys, datarepr=(b'slice=%d:%d %r', start, stop, self))
Yuya Nishihara
smartset: extract method to slice abstractsmartset...
r32819
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 class baseset(abstractsmartset):
"""Basic data structure that represents a revset and contains the basic
operation that it should be able to perform.
Every method in this class should be implemented by any smartset class.
Jun Wu
smartset: add some doctests...
r31019
This class could be constructed by an (unordered) set, or an (ordered)
list-like object. If a set is provided, it'll be sorted lazily.
>>> x = [4, 0, 7, 6]
>>> y = [5, 6, 7, 3]
Construct by a set:
>>> xs = baseset(set(x))
>>> ys = baseset(set(y))
>>> [list(i) for i in [xs + ys, xs & ys, xs - ys]]
[[0, 4, 6, 7, 3, 5], [6, 7], [0, 4]]
>>> [type(i).__name__ for i in [xs + ys, xs & ys, xs - ys]]
Jun Wu
smartset: use native set operations as fast paths...
r31020 ['addset', 'baseset', 'baseset']
Jun Wu
smartset: add some doctests...
r31019
Construct by a list-like:
>>> xs = baseset(x)
>>> ys = baseset(i for i in y)
>>> [list(i) for i in [xs + ys, xs & ys, xs - ys]]
[[4, 0, 7, 6, 5, 3], [7, 6], [4, 0]]
>>> [type(i).__name__ for i in [xs + ys, xs & ys, xs - ys]]
['addset', 'filteredset', 'filteredset']
Populate "_set" fields in the lists so set optimization may be used:
>>> [1 in xs, 3 in ys]
[False, True]
Without sort(), results won't be changed:
>>> [list(i) for i in [xs + ys, xs & ys, xs - ys]]
[[4, 0, 7, 6, 5, 3], [7, 6], [4, 0]]
>>> [type(i).__name__ for i in [xs + ys, xs & ys, xs - ys]]
['addset', 'filteredset', 'filteredset']
Jun Wu
smartset: use native set operations as fast paths...
r31020 With sort(), set optimization could be used:
Jun Wu
smartset: add some doctests...
r31019 >>> xs.sort(reverse=True)
>>> [list(i) for i in [xs + ys, xs & ys, xs - ys]]
[[7, 6, 4, 0, 5, 3], [7, 6], [4, 0]]
>>> [type(i).__name__ for i in [xs + ys, xs & ys, xs - ys]]
Jun Wu
smartset: use native set operations as fast paths...
r31020 ['addset', 'baseset', 'baseset']
Jun Wu
smartset: add some doctests...
r31019
>>> ys.sort()
>>> [list(i) for i in [xs + ys, xs & ys, xs - ys]]
[[7, 6, 4, 0, 3, 5], [7, 6], [4, 0]]
>>> [type(i).__name__ for i in [xs + ys, xs & ys, xs - ys]]
Jun Wu
smartset: use native set operations as fast paths...
r31020 ['addset', 'baseset', 'baseset']
Jun Wu
smartset: preserve istopo for baseset operations...
r31066
istopo is preserved across set operations
>>> xs = baseset(set(x), istopo=True)
>>> rs = xs & ys
>>> type(rs).__name__
'baseset'
>>> rs._istopo
True
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 """
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __init__(self, data=(), datarepr=None, istopo=False):
"""
datarepr: a tuple of (format, obj, ...), a function or an object that
provides a printable representation of the given data.
"""
self._ascending = None
self._istopo = istopo
Yuya Nishihara
smartset: reorder initialization of baseset in more intuitive way...
r31127 if isinstance(data, set):
# converting set to list has a cost, do it lazily
self._set = data
# set has no order we pick one for stability purpose
self._ascending = True
else:
if not isinstance(data, list):
Jun Wu
smartset: convert set to list lazily...
r31015 data = list(data)
self._list = data
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 self._datarepr = datarepr
@util.propertycache
def _set(self):
return set(self._list)
@util.propertycache
def _asclist(self):
asclist = self._list[:]
asclist.sort()
return asclist
Jun Wu
smartset: convert set to list lazily...
r31015 @util.propertycache
def _list(self):
# _list is only lazily constructed if we have _set
Augie Fackler
cleanup: remove pointless r-prefixes on single-quoted strings...
r43906 assert '_set' in self.__dict__
Jun Wu
smartset: convert set to list lazily...
r31015 return list(self._set)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __iter__(self):
if self._ascending is None:
return iter(self._list)
elif self._ascending:
return iter(self._asclist)
else:
return reversed(self._asclist)
def fastasc(self):
return iter(self._asclist)
def fastdesc(self):
return reversed(self._asclist)
@util.propertycache
def __contains__(self):
return self._set.__contains__
def __nonzero__(self):
Jun Wu
smartset: convert set to list lazily...
r31015 return bool(len(self))
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Gregory Szorc
py3: add __bool__ to every class defining __nonzero__...
r31476 __bool__ = __nonzero__
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def sort(self, reverse=False):
self._ascending = not bool(reverse)
self._istopo = False
def reverse(self):
if self._ascending is None:
self._list.reverse()
else:
self._ascending = not self._ascending
self._istopo = False
def __len__(self):
Augie Fackler
cleanup: remove pointless r-prefixes on single-quoted strings...
r43906 if '_list' in self.__dict__:
Jun Wu
smartset: convert set to list lazily...
r31015 return len(self._list)
else:
return len(self._set)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
def isascending(self):
"""Returns True if the collection is ascending order, False if not.
This is part of the mandatory API for smartset."""
if len(self) <= 1:
return True
return self._ascending is not None and self._ascending
def isdescending(self):
"""Returns True if the collection is descending order, False if not.
This is part of the mandatory API for smartset."""
if len(self) <= 1:
return True
return self._ascending is not None and not self._ascending
def istopo(self):
"""Is the collection is in topographical order or not.
This is part of the mandatory API for smartset."""
if len(self) <= 1:
return True
return self._istopo
def first(self):
if self:
if self._ascending is None:
return self._list[0]
elif self._ascending:
return self._asclist[0]
else:
return self._asclist[-1]
return None
def last(self):
if self:
if self._ascending is None:
return self._list[-1]
elif self._ascending:
return self._asclist[-1]
else:
return self._asclist[0]
return None
Jun Wu
smartset: use native set operations as fast paths...
r31020 def _fastsetop(self, other, op):
# try to use native set operations as fast paths
Augie Fackler
formatting: blacken the codebase...
r43346 if (
type(other) is baseset
Augie Fackler
cleanup: remove pointless r-prefixes on single-quoted strings...
r43906 and '_set' in other.__dict__
and '_set' in self.__dict__
Augie Fackler
formatting: blacken the codebase...
r43346 and self._ascending is not None
):
s = baseset(
data=getattr(self._set, op)(other._set), istopo=self._istopo
)
Jun Wu
smartset: use native set operations as fast paths...
r31020 s._ascending = self._ascending
else:
s = getattr(super(baseset, self), op)(other)
return s
def __and__(self, other):
smartset: set attribute using sysstr instead of bytes...
r51805 return self._fastsetop(other, '__and__')
Jun Wu
smartset: use native set operations as fast paths...
r31020
def __sub__(self, other):
smartset: set attribute using sysstr instead of bytes...
r51805 return self._fastsetop(other, '__sub__')
Jun Wu
smartset: use native set operations as fast paths...
r31020
Yuya Nishihara
smartset: micro optimize baseset.slice() to use slice of list...
r32820 def _slice(self, start, stop):
# creating new list should be generally cheaper than iterating items
if self._ascending is None:
return baseset(self._list[start:stop], istopo=self._istopo)
data = self._asclist
if not self._ascending:
start, stop = max(len(data) - stop, 0), max(len(data) - start, 0)
s = baseset(data[start:stop], istopo=self._istopo)
s._ascending = self._ascending
return s
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 @encoding.strmethod
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __repr__(self):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 d = {None: b'', False: b'-', True: b'+'}[self._ascending]
Yuya Nishihara
stringutil: move _formatsetrepr() from smartset...
r38595 s = stringutil.buildrepr(self._datarepr)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 if not s:
l = self._list
# if _list has been built from a set, it might have a different
# order from one python implementation to another.
# We fallback to the sorted version for a stable output.
if self._ascending is not None:
l = self._asclist
Yuya Nishihara
py3: factor out byterepr() which returns an asciified value on py3
r36279 s = pycompat.byterepr(l)
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 return b'<%s%s %s>' % (_typename(self), d, s)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 class filteredset(abstractsmartset):
"""Duck type for baseset class which iterates lazily over the revisions in
the subset and contains a function which tests for membership in the
revset
"""
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __init__(self, subset, condition=lambda x: True, condrepr=None):
"""
condition: a function that decide whether a revision in the subset
belongs to the revset or not.
condrepr: a tuple of (format, obj, ...), a function or an object that
provides a printable representation of the given condition.
"""
self._subset = subset
self._condition = condition
self._condrepr = condrepr
def __contains__(self, x):
return x in self._subset and self._condition(x)
def __iter__(self):
return self._iterfilter(self._subset)
def _iterfilter(self, it):
cond = self._condition
for x in it:
if cond(x):
yield x
@property
def fastasc(self):
it = self._subset.fastasc
if it is None:
return None
return lambda: self._iterfilter(it())
@property
def fastdesc(self):
it = self._subset.fastdesc
if it is None:
return None
return lambda: self._iterfilter(it())
def __nonzero__(self):
fast = None
Augie Fackler
formatting: blacken the codebase...
r43346 candidates = [
self.fastasc if self.isascending() else None,
self.fastdesc if self.isdescending() else None,
self.fastasc,
self.fastdesc,
]
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 for candidate in candidates:
if candidate is not None:
fast = candidate
break
if fast is not None:
it = fast()
else:
it = self
for r in it:
return True
return False
Gregory Szorc
py3: add __bool__ to every class defining __nonzero__...
r31476 __bool__ = __nonzero__
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __len__(self):
# Basic implementation to be changed in future patches.
# until this gets improved, we use generator expression
# here, since list comprehensions are free to call __len__ again
# causing infinite recursion
l = baseset(r for r in self)
return len(l)
def sort(self, reverse=False):
self._subset.sort(reverse=reverse)
def reverse(self):
self._subset.reverse()
def isascending(self):
return self._subset.isascending()
def isdescending(self):
return self._subset.isdescending()
def istopo(self):
return self._subset.istopo()
def first(self):
for x in self:
return x
return None
def last(self):
it = None
if self.isascending():
it = self.fastdesc
elif self.isdescending():
it = self.fastasc
if it is not None:
for x in it():
return x
Augie Fackler
formatting: blacken the codebase...
r43346 return None # empty case
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 else:
x = None
for x in self:
pass
return x
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 @encoding.strmethod
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __repr__(self):
Yuya Nishihara
py3: factor out byterepr() which returns an asciified value on py3
r36279 xs = [pycompat.byterepr(self._subset)]
Yuya Nishihara
stringutil: move _formatsetrepr() from smartset...
r38595 s = stringutil.buildrepr(self._condrepr)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 if s:
xs.append(s)
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 return b'<%s %s>' % (_typename(self), b', '.join(xs))
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def _iterordered(ascending, iter1, iter2):
"""produce an ordered iteration from two iterators with the same order
The ascending is used to indicated the iteration direction.
"""
choice = max
if ascending:
choice = min
val1 = None
val2 = None
try:
# Consume both iterators in an ordered way until one is empty
while True:
if val1 is None:
val1 = next(iter1)
if val2 is None:
val2 = next(iter2)
n = choice(val1, val2)
yield n
if val1 == n:
val1 = None
if val2 == n:
val2 = None
except StopIteration:
# Flush any remaining values and consume the other one
it = iter2
if val1 is not None:
yield val1
it = iter1
elif val2 is not None:
# might have been equality and both are empty
yield val2
for val in it:
yield val
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 class addset(abstractsmartset):
"""Represent the addition of two sets
Wrapper structure for lazily adding two structures without losing much
performance on the __contains__ method
If the ascending attribute is set, that means the two structures are
ordered in either an ascending or descending way. Therefore, we can add
them maintaining the order by iterating over both at the same time
>>> xs = baseset([0, 3, 2])
>>> ys = baseset([5, 2, 4])
>>> rs = addset(xs, ys)
>>> bool(rs), 0 in rs, 1 in rs, 5 in rs, rs.first(), rs.last()
(True, True, False, True, 0, 4)
>>> rs = addset(xs, baseset([]))
>>> bool(rs), 0 in rs, 1 in rs, rs.first(), rs.last()
(True, True, False, 0, 2)
>>> rs = addset(baseset([]), baseset([]))
>>> bool(rs), 0 in rs, rs.first(), rs.last()
(False, False, None, None)
iterate unsorted:
>>> rs = addset(xs, ys)
>>> # (use generator because pypy could call len())
>>> list(x for x in rs) # without _genlist
[0, 3, 2, 5, 4]
>>> assert not rs._genlist
>>> len(rs)
5
>>> [x for x in rs] # with _genlist
[0, 3, 2, 5, 4]
>>> assert rs._genlist
iterate ascending:
>>> rs = addset(xs, ys, ascending=True)
>>> # (use generator because pypy could call len())
>>> list(x for x in rs), list(x for x in rs.fastasc()) # without _asclist
([0, 2, 3, 4, 5], [0, 2, 3, 4, 5])
>>> assert not rs._asclist
>>> len(rs)
5
>>> [x for x in rs], [x for x in rs.fastasc()]
([0, 2, 3, 4, 5], [0, 2, 3, 4, 5])
>>> assert rs._asclist
iterate descending:
>>> rs = addset(xs, ys, ascending=False)
>>> # (use generator because pypy could call len())
>>> list(x for x in rs), list(x for x in rs.fastdesc()) # without _asclist
([5, 4, 3, 2, 0], [5, 4, 3, 2, 0])
>>> assert not rs._asclist
>>> len(rs)
5
>>> [x for x in rs], [x for x in rs.fastdesc()]
([5, 4, 3, 2, 0], [5, 4, 3, 2, 0])
>>> assert rs._asclist
iterate ascending without fastasc:
>>> rs = addset(xs, generatorset(ys), ascending=True)
>>> assert rs.fastasc is None
>>> [x for x in rs]
[0, 2, 3, 4, 5]
iterate descending without fastdesc:
>>> rs = addset(generatorset(xs), ys, ascending=False)
>>> assert rs.fastdesc is None
>>> [x for x in rs]
[5, 4, 3, 2, 0]
"""
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __init__(self, revs1, revs2, ascending=None):
self._r1 = revs1
self._r2 = revs2
self._iter = None
self._ascending = ascending
self._genlist = None
self._asclist = None
def __len__(self):
return len(self._list)
def __nonzero__(self):
return bool(self._r1) or bool(self._r2)
Gregory Szorc
py3: add __bool__ to every class defining __nonzero__...
r31476 __bool__ = __nonzero__
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 @util.propertycache
def _list(self):
if not self._genlist:
self._genlist = baseset(iter(self))
return self._genlist
def __iter__(self):
"""Iterate over both collections without repeating elements
If the ascending attribute is not set, iterate over the first one and
then over the second one checking for membership on the first one so we
dont yield any duplicates.
If the ascending attribute is set, iterate over both collections at the
same time, yielding only one value at a time in the given order.
"""
if self._ascending is None:
if self._genlist:
return iter(self._genlist)
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def arbitraryordergen():
for r in self._r1:
yield r
inr1 = self._r1.__contains__
for r in self._r2:
if not inr1(r):
yield r
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 return arbitraryordergen()
# try to use our own fast iterator if it exists
self._trysetasclist()
if self._ascending:
safehasattr: pass attribute name as string instead of bytes...
r51491 attr = 'fastasc'
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 else:
safehasattr: pass attribute name as string instead of bytes...
r51492 attr = 'fastdesc'
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 it = getattr(self, attr)
if it is not None:
return it()
# maybe half of the component supports fast
# get iterator for _r1
iter1 = getattr(self._r1, attr)
if iter1 is None:
# let's avoid side effect (not sure it matters)
iter1 = iter(sorted(self._r1, reverse=not self._ascending))
else:
iter1 = iter1()
# get iterator for _r2
iter2 = getattr(self._r2, attr)
if iter2 is None:
# let's avoid side effect (not sure it matters)
iter2 = iter(sorted(self._r2, reverse=not self._ascending))
else:
iter2 = iter2()
return _iterordered(self._ascending, iter1, iter2)
def _trysetasclist(self):
"""populate the _asclist attribute if possible and necessary"""
if self._genlist is not None and self._asclist is None:
self._asclist = sorted(self._genlist)
@property
def fastasc(self):
self._trysetasclist()
if self._asclist is not None:
return self._asclist.__iter__
iter1 = self._r1.fastasc
iter2 = self._r2.fastasc
if None in (iter1, iter2):
return None
return lambda: _iterordered(True, iter1(), iter2())
@property
def fastdesc(self):
self._trysetasclist()
if self._asclist is not None:
return self._asclist.__reversed__
iter1 = self._r1.fastdesc
iter2 = self._r2.fastdesc
if None in (iter1, iter2):
return None
return lambda: _iterordered(False, iter1(), iter2())
def __contains__(self, x):
return x in self._r1 or x in self._r2
def sort(self, reverse=False):
"""Sort the added set
For this we use the cached list with all the generated values and if we
know they are ascending or descending we can sort them in a smart way.
"""
self._ascending = not reverse
def isascending(self):
return self._ascending is not None and self._ascending
def isdescending(self):
return self._ascending is not None and not self._ascending
def istopo(self):
# not worth the trouble asserting if the two sets combined are still
# in topographical order. Use the sort() predicate to explicitly sort
# again instead.
return False
def reverse(self):
if self._ascending is None:
self._list.reverse()
else:
self._ascending = not self._ascending
def first(self):
for x in self:
return x
return None
def last(self):
self.reverse()
val = self.first()
self.reverse()
return val
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 @encoding.strmethod
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __repr__(self):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 d = {None: b'', False: b'-', True: b'+'}[self._ascending]
return b'<%s%s %r, %r>' % (_typename(self), d, self._r1, self._r2)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 class generatorset(abstractsmartset):
"""Wrap a generator for lazy iteration
Wrapper structure for generators that provides lazy membership and can
be iterated more than once.
When asked for membership it generates values until either it finds the
requested one or has gone through all the elements in the generator
Yuya Nishihara
smartset: fix generatorset.last() to not return the first element (issue5609)
r33109
>>> xs = generatorset([0, 1, 4], iterasc=True)
>>> assert xs.last() == xs.last()
>>> xs.last() # cached
4
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 """
Augie Fackler
formatting: blacken the codebase...
r43346
Gregory Szorc
smartset: split generatorset classes to avoid cycle...
r35517 def __new__(cls, gen, iterasc=None):
if iterasc is None:
typ = cls
elif iterasc:
typ = _generatorsetasc
else:
typ = _generatorsetdesc
return super(generatorset, cls).__new__(typ)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __init__(self, gen, iterasc=None):
"""
gen: a generator producing the values for the generatorset.
"""
self._gen = gen
self._asclist = None
self._cache = {}
self._genlist = []
self._finished = False
self._ascending = True
def __nonzero__(self):
# Do not use 'for r in self' because it will enforce the iteration
# order (default ascending), possibly unrolling a whole descending
# iterator.
if self._genlist:
return True
for r in self._consumegen():
return True
return False
Gregory Szorc
py3: add __bool__ to every class defining __nonzero__...
r31476 __bool__ = __nonzero__
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __contains__(self, x):
if x in self._cache:
return self._cache[x]
# Use new values only, as existing values would be cached.
for l in self._consumegen():
if l == x:
return True
self._cache[x] = False
return False
def __iter__(self):
if self._ascending:
it = self.fastasc
else:
it = self.fastdesc
if it is not None:
return it()
# we need to consume the iterator
for x in self._consumegen():
pass
# recall the same code
return iter(self)
def _iterator(self):
if self._finished:
return iter(self._genlist)
# We have to use this complex iteration strategy to allow multiple
# iterations at the same time. We need to be able to catch revision
# removed from _consumegen and added to genlist in another instance.
#
# Getting rid of it would provide an about 15% speed up on this
# iteration.
genlist = self._genlist
Yuya Nishihara
py3: use next() to obtain next item from inner generator of generatorset...
r31446 nextgen = self._consumegen()
Augie Fackler
formatting: blacken the codebase...
r43346 _len, _next = len, next # cache global lookup
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def gen():
i = 0
while True:
if i < _len(genlist):
yield genlist[i]
else:
Martin von Zweigbergk
py3: catch StopIteration from next() in generatorset...
r32977 try:
yield _next(nextgen)
except StopIteration:
return
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 i += 1
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 return gen()
def _consumegen(self):
cache = self._cache
genlist = self._genlist.append
for item in self._gen:
cache[item] = True
genlist(item)
yield item
if not self._finished:
self._finished = True
asc = self._genlist[:]
asc.sort()
self._asclist = asc
self.fastasc = asc.__iter__
self.fastdesc = asc.__reversed__
def __len__(self):
for x in self._consumegen():
pass
return len(self._genlist)
def sort(self, reverse=False):
self._ascending = not reverse
def reverse(self):
self._ascending = not self._ascending
def isascending(self):
return self._ascending
def isdescending(self):
return not self._ascending
def istopo(self):
# not worth the trouble asserting if the two sets combined are still
# in topographical order. Use the sort() predicate to explicitly sort
# again instead.
return False
def first(self):
if self._ascending:
it = self.fastasc
else:
it = self.fastdesc
if it is None:
# we need to consume all and try again
for x in self._consumegen():
pass
return self.first()
return next(it(), None)
def last(self):
if self._ascending:
it = self.fastdesc
else:
it = self.fastasc
if it is None:
# we need to consume all and try again
for x in self._consumegen():
pass
Yuya Nishihara
smartset: fix generatorset.last() to not return the first element (issue5609)
r33109 return self.last()
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 return next(it(), None)
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 @encoding.strmethod
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __repr__(self):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 d = {False: b'-', True: b'+'}[self._ascending]
return b'<%s%s>' % (_typename(self), d)
Gregory Szorc
smartset: split generatorset classes to avoid cycle...
r35517
Augie Fackler
formatting: blacken the codebase...
r43346
Gregory Szorc
smartset: split generatorset classes to avoid cycle...
r35517 class _generatorsetasc(generatorset):
"""Special case of generatorset optimized for ascending generators."""
fastasc = generatorset._iterator
def __contains__(self, x):
if x in self._cache:
return self._cache[x]
# Use new values only, as existing values would be cached.
for l in self._consumegen():
if l == x:
return True
if l > x:
break
self._cache[x] = False
return False
Augie Fackler
formatting: blacken the codebase...
r43346
Gregory Szorc
smartset: split generatorset classes to avoid cycle...
r35517 class _generatorsetdesc(generatorset):
"""Special case of generatorset optimized for descending generators."""
fastdesc = generatorset._iterator
def __contains__(self, x):
if x in self._cache:
return self._cache[x]
# Use new values only, as existing values would be cached.
for l in self._consumegen():
if l == x:
return True
if l < x:
break
self._cache[x] = False
return False
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: extract spanset factory to make it constructed without a repo...
r32818 def spanset(repo, start=0, end=None):
"""Create a spanset that represents a range of repository revisions
start: first revision included the set (default to 0)
end: first revision excluded (last+1) (default to len(repo))
Spanset will be descending if `end` < `start`.
"""
if end is None:
end = len(repo)
ascending = start <= end
if not ascending:
start, end = end + 1, start + 1
return _spanset(start, end, ascending, repo.changelog.filteredrevs)
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: extract spanset factory to make it constructed without a repo...
r32818 class _spanset(abstractsmartset):
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 """Duck type for baseset class which represents a range of revisions and
can work lazily and without having all the range in memory
Manuel Jacob
py3: replace mention of “xrange” in docstring by “range”
r50181 Note that spanset(x, y) behave almost like range(x, y) except for two
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 notable points:
- when x < y it will be automatically descending,
- revision filtered with this repoview will be skipped.
"""
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: extract spanset factory to make it constructed without a repo...
r32818 def __init__(self, start, end, ascending, hiddenrevs):
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 self._start = start
self._end = end
Yuya Nishihara
smartset: extract spanset factory to make it constructed without a repo...
r32818 self._ascending = ascending
self._hiddenrevs = hiddenrevs
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
def sort(self, reverse=False):
self._ascending = not reverse
def reverse(self):
self._ascending = not self._ascending
def istopo(self):
# not worth the trouble asserting if the two sets combined are still
# in topographical order. Use the sort() predicate to explicitly sort
# again instead.
return False
def _iterfilter(self, iterrange):
s = self._hiddenrevs
for r in iterrange:
if r not in s:
yield r
def __iter__(self):
if self._ascending:
return self.fastasc()
else:
return self.fastdesc()
def fastasc(self):
Manuel Jacob
py3: replace `pycompat.xrange` by `range`
r50179 iterrange = range(self._start, self._end)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 if self._hiddenrevs:
return self._iterfilter(iterrange)
return iter(iterrange)
def fastdesc(self):
Manuel Jacob
py3: replace `pycompat.xrange` by `range`
r50179 iterrange = range(self._end - 1, self._start - 1, -1)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 if self._hiddenrevs:
return self._iterfilter(iterrange)
return iter(iterrange)
def __contains__(self, rev):
hidden = self._hiddenrevs
Augie Fackler
formatting: blacken the codebase...
r43346 return (self._start <= rev < self._end) and not (
hidden and rev in hidden
)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
def __nonzero__(self):
for r in self:
return True
return False
Gregory Szorc
py3: add __bool__ to every class defining __nonzero__...
r31476 __bool__ = __nonzero__
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __len__(self):
if not self._hiddenrevs:
return abs(self._end - self._start)
else:
count = 0
start = self._start
end = self._end
for rev in self._hiddenrevs:
if (end < rev <= start) or (start <= rev < end):
count += 1
return abs(self._end - self._start) - count
def isascending(self):
return self._ascending
def isdescending(self):
return not self._ascending
def first(self):
if self._ascending:
it = self.fastasc
else:
it = self.fastdesc
for x in it():
return x
return None
def last(self):
if self._ascending:
it = self.fastdesc
else:
it = self.fastasc
for x in it():
return x
return None
Yuya Nishihara
smartset: micro optimize spanset.slice() to narrow range accordingly...
r32821 def _slice(self, start, stop):
if self._hiddenrevs:
# unoptimized since all hidden revisions in range has to be scanned
return super(_spanset, self)._slice(start, stop)
if self._ascending:
x = min(self._start + start, self._end)
y = min(self._start + stop, self._end)
else:
x = max(self._end - stop, self._start)
y = max(self._end - start, self._start)
return _spanset(x, y, self._ascending, self._hiddenrevs)
Yuya Nishihara
py3: build repr() of smartset as bytes then convert to str...
r35919 @encoding.strmethod
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 def __repr__(self):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 d = {False: b'-', True: b'+'}[self._ascending]
return b'<%s%s %d:%d>' % (_typename(self), d, self._start, self._end)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
Augie Fackler
formatting: blacken the codebase...
r43346
Yuya Nishihara
smartset: extract spanset factory to make it constructed without a repo...
r32818 class fullreposet(_spanset):
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 """a set containing all revisions in the repo
This class exists to host special optimization and magic to handle virtual
revisions such as "null".
"""
def __init__(self, repo):
Augie Fackler
formatting: blacken the codebase...
r43346 super(fullreposet, self).__init__(
0, len(repo), True, repo.changelog.filteredrevs
)
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
def __and__(self, other):
"""As self contains the whole repo, all of the other set should also be
in self. Therefore `self & other = other`.
This boldly assumes the other contains valid revs only.
"""
# other not a smartset, make is so
safehasattr: drop usage in favor of hasattr...
r51821 if not hasattr(other, 'isascending'):
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881 # filter out hidden revision
# (this boldly assumes all smartset are pure)
#
# `other` was used with "&", let's assume this is a set like
# object.
Martin von Zweigbergk
smartset: don't ignore hidden revs when intersecting...
r52004 other = baseset(other)
if self._hiddenrevs:
other = other - self._hiddenrevs
Yuya Nishihara
smartset: move set classes and related functions from revset module (API)...
r30881
other.sort(reverse=self.isdescending())
return other