upstream/mercurial-mirror Commit - r52244:bbbfa00d

delta-find: remove the "candidate groups" layer...

marmoute -

r52244:bbbfa00d default

parent child

mercurial/revlogutils/deltas.py

0 +50 -49

		@@ -821,6 +821,7 b' class _PrevDeltaSearch(_BaseDeltaSearch)'
821	821	def _init_group(self):
822	822	self.current_stage = _STAGE_PREV
823	823	self.current_group = [self.target_rev - 1]
	824	self.tested.update(self.current_group)
824	825
825	826	def next_group(self, good_delta=None):
826	827	self.current_stage = _STAGE_FULL
		@@ -837,60 +838,60 b' class _DeltaSearch(_BaseDeltaSearch):'
837	838	# Why search for delta base if we cannot use a delta base ?
838	839	# also see issue6056
839	840	assert self.revlog.delta_config.general_delta
840		self._candidates_iterator = self._candidate_groups()
	841	self._candidates_iterator = self._refined_groups()
841	842	self._last_good = None
842		self.current_group = self._candidates_iterator.send(self._last_good)
	843	self._next_internal_group()
	844
	845	def _next_internal_group(self):
	846	# self._internal_group can be larger than self.current_group
	847	self._internal_idx = 0
	848	group = self._candidates_iterator.send(self._last_good)
	849	if group is not None:
	850	group = self._pre_filter_candidate_revs(group)
	851	self._internal_group = group
	852	if self._internal_group is None:
	853	self.current_group = None
	854	elif len(self._internal_group) == 0:
	855	self.next_group()
	856	else:
	857	chunk_size = self.revlog.delta_config.candidate_group_chunk_size
	858	if chunk_size > 0:
	859	self.current_group = self._internal_group[:chunk_size]
	860	self._internal_idx += chunk_size
	861	else:
	862	self.current_group = self._internal_group
	863	self._internal_idx += len(self.current_group)
	864
	865	self.tested.update(self.current_group)
843	866
844	867	def next_group(self, good_delta=None):
	868	old_good = self._last_good
845	869	if good_delta is not None:
846	870	self._last_good = good_delta.base
847		self.current_group = self._candidates_iterator.send(self._last_good)
848
849		def _candidate_groups(self):
850		"""Provides group of revision to be tested as delta base
851
852		This top level function focus on emitting groups with unique and
853		worthwhile content. See _raw_candidate_groups for details about the
854		group order.
855		"""
856		good = None
857
858		group_chunk_size = self.revlog.delta_config.candidate_group_chunk_size
859
860		tested = self.tested # prefetch for speed and code compactness
861		candidates = self._refined_groups()
862		while True:
863		temptative = candidates.send(good)
864		if temptative is None:
865		break
866		group = self._pre_filter_candidate_revs(temptative)
867		if group:
868		# When the size of the candidate group is big, it can result in
869		# a quite significant performance impact. To reduce this, we
870		# can send them in smaller batches until the new batch does not
871		# provide any improvements.
872		#
873		# This might reduce the overall efficiency of the compression
874		# in some corner cases, but that should also prevent very
875		# pathological cases from being an issue. (eg. 20 000
876		# candidates).
877		#
878		# XXX note that the ordering of the group becomes important as
879		# it now impacts the final result. The current order is
880		# unprocessed and can be improved.
881		if group_chunk_size == 0:
882		tested.update(group)
883		good = yield tuple(group)
884		else:
885		prev_good = good
886		for start in range(0, len(group), group_chunk_size):
887		sub_group = group[start : start + group_chunk_size]
888		tested.update(sub_group)
889		good = yield tuple(sub_group)
890		if prev_good == good:
891		break
892
893		yield None
	871	if (self._internal_idx < len(self._internal_group)) and (
	872	old_good != good_delta
	873	):
	874	# When the size of the candidate group is big, it can result in
	875	# a quite significant performance impact. To reduce this, we
	876	# can send them in smaller batches until the new batch does not
	877	# provide any improvements.
	878	#
	879	# This might reduce the overall efficiency of the compression
	880	# in some corner cases, but that should also prevent very
	881	# pathological cases from being an issue. (eg. 20 000
	882	# candidates).
	883	#
	884	# XXX note that the ordering of the group becomes important as
	885	# it now impacts the final result. The current order is
	886	# unprocessed and can be improved.
	887	next_idx = self._internal_idx + self._group_chunk_size
	888	self.current_group = self._internal_group[
	889	self._internal_idx : next_idx
	890	]
	891	self.tested.update(self.current_group)
	892	self._internal_idx = next_idx
	893	else:
	894	self._next_internal_group()
894	895
895	896	def _pre_filter_candidate_revs(self, temptative):
896	897	"""filter possible candidate before computing a delta

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages