upstream/mercurial-mirror Files · mercurial/repocache.py

nodemap: track the maximum revision tracked in the nodemap...

nodemap: track the maximum revision tracked in the nodemap. We need a simple way to detect when the on-disk data contains fewer revisions than the index we read from disk. The docket file is meant for this; we just had to start tracking that data. We should also try to detect strip operations, but we will deal with this in later changesets. Right now we are focusing on defining the API for indexes supporting the persistent nodemap. Differential Revision: https://phab.mercurial-scm.org/D7888

Martin von Zweigbergk - - Load All Authors

File last commit:

r43387:8ff1ecfa default


                r44807:e41a164d

default

Download file

             repocache.py
        
                    139 lines
            
             | 4.5 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / repocache.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        Yuya Nishihara
    
commandserver: preload repository in master server and reuse its file cache...

              r41035
            
      # repocache.py - in-memory repository cache for long-running services

      #

      # Copyright 2018 Yuya Nishihara <yuya@tcha.org>

      #

      # This software may be used and distributed according to the terms of the

      # GNU General Public License version 2 or any later version.

      from __future__ import absolute_import

      import collections

      import gc

      import threading

      from . import (

          error,

          hg,

          obsolete,

          scmutil,

          util,

      )

        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        Yuya Nishihara
    
commandserver: preload repository in master server and reuse its file cache...

              r41035
            
      class repoloader(object):
          """Preload repositories on a background thread

          Intended for a forking server: a cached repo may only be fetched once
          the server has fork()ed a worker and the loader thread is no longer
          running.
          """

          def __init__(self, ui, maxlen):
              """Set up an idle loader holding at most ``maxlen`` entries

              ``ui`` is copied, so the loader works on its own ui object. No
              thread is created until start() is called.
              """
              self._ui = ui.copy()
              self._cache = util.lrucachedict(max=maxlen)
              # A bounded deque plus an Event stands in for Queue, because the
              # deque silently drops its oldest items once maxlen is exceeded.
              self._inqueue = collections.deque(maxlen=maxlen)
              self._newentry = threading.Event()
              self._accepting = False
              self._thread = None

          def start(self):
              """Spawn the loader thread unless the cache is disabled"""
              assert not self._thread
              cachedisabled = self._inqueue.maxlen == 0
              if cachedisabled:
                  # nothing could ever be queued, so a thread would be useless
                  return
              self._accepting = True
              worker = threading.Thread(target=self._mainloop)
              self._thread = worker
              worker.start()

          def stop(self):
              """Stop the loader thread and drop all cached and queued items

              Does nothing if no loader thread was started.
              """
              worker = self._thread
              if not worker:
                  return
              # clear the flag first, then wake the thread so it sees the change
              self._accepting = False
              self._newentry.set()
              worker.join()
              self._thread = None
              self._cache.clear()
              self._inqueue.clear()

          def load(self, path):
              """Queue ``path`` so the repository is loaded in the background"""
              self._inqueue.append(path)
              # signal the loader thread that there is something to pick up
              self._newentry.set()

          def get(self, path):
              """Look up the cached repo for ``path``; None if there is none

              Call this only after fork(), when the loader thread is stopped.
              While the loader is running, a returned repo could be modified
              under the caller's feet, so ProgrammingError is raised instead.
              """
              loader = self._thread
              if loader and loader.is_alive():
                  raise error.ProgrammingError(
                      b'cannot obtain cached repo while loader is active'
                  )
              return self._cache.peek(path, None)

          def _mainloop(self):
              """Loader thread body: wait for requests and load them in order"""
              while self._accepting:
                  # Run the expensive GC here rather than after fork(), where
                  # it would cancel the benefit of COW. This assumes the GIL is
                  # held while GC runs in the loader thread. If it is not,
                  # gc.collect() may have to move to the main thread so that
                  # fork() never interrupts a thread in the middle of GC.
                  gc.collect()

                  self._newentry.wait()
                  while self._accepting:
                      # reset before popping so a request that arrives while
                      # we are busy sets the event again
                      self._newentry.clear()
                      try:
                          path = self._inqueue.popleft()
                      except IndexError:
                          # queue drained; go back to waiting
                          break

                      def loadone():
                          return self._load(path)

                      scmutil.callcatch(self._ui, loadone)

          def _load(self, path):
              """Load (or refresh) the repo at ``path`` and store it in the cache"""
              begin = util.timer()
              # TODO: repo should be recreated if storage configuration changed
              try:
                  # remove the entry up front so a half-refreshed repo is never
                  # reachable through the cache
                  repo = self._cache.pop(path)
              except KeyError:
                  repo = hg.repository(self._ui, path).unfiltered()
              _warmupcache(repo)
              message = b'loaded repo into cache: %s (in %.3fs)\n'
              repo.ui.log(b'repocache', message, path, util.timer() - begin)
              self._cache.insert(path, repo)

        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        Yuya Nishihara
    
commandserver: preload repository in master server and reuse its file cache...

              r41035
            
      # TODO: think about proper API of preloading cache

      def _warmupcache(repo):
          """Touch the attributes of ``repo`` that should be loaded up front

          The repo is invalidated first. After that, the attribute accesses and
          calls below are made only for their side effects; their results are
          discarded.
          """
          repo.invalidateall()
          repo.changelog
          # access each obsstore attribute in turn, looking up repo.obsstore
          # afresh every time
          for attrname in ('_all', 'successors', 'predecessors', 'children'):
              getattr(repo.obsstore, attrname)
          for setname in obsolete.cachefuncs:
              obsolete.getrevs(repo, setname)
          repo._phasecache.loadphaserevs(repo)

        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        Yuya Nishihara
    
commandserver: preload repository in master server and reuse its file cache...

              r41035
            
      # TODO: think about proper API of attaching preloaded attributes

      def copycache(srcrepo, destrepo):
          """Copy cached attributes from srcrepo to destrepo

          For each known key present in ``srcrepo._filecache``, the same cache
          entry object is stored in ``destrepo._filecache`` (it is shared, not
          duplicated) and the listed attributes of ``entry.obj`` are re-pointed
          at ``destrepo.svfs``.
          """
          destfilecache = destrepo._filecache
          srcfilecache = srcrepo._filecache
          # file cache key -> attributes of the cached object to rebind
          rebindings = (
              (b'changelog', ('opener', '_realopener')),
              (b'obsstore', ('svfs',)),
              (b'_phasecache', ('opener',)),
          )
          for key, attrnames in rebindings:
              if key not in srcfilecache:
                  continue
              entry = srcfilecache[key]
              destfilecache[key] = entry
              # read svfs only when an entry is actually copied
              svfs = destrepo.svfs
              for attrname in attrnames:
                  setattr(entry.obj, attrname, svfs)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	# repocache.py - in-memory repository cache for long-running services
		#
		# Copyright 2018 Yuya Nishihara <yuya@tcha.org>
		#
		# This software may be used and distributed according to the terms of the
		# GNU General Public License version 2 or any later version.

		from __future__ import absolute_import

		import collections
		import gc
		import threading

		from . import (
		error,
		hg,
		obsolete,
		scmutil,
		util,
		)

Augie Fackler formatting: blacken the codebase...	r43346
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	class repoloader(object):
		"""Load repositories in background thread

		This is designed for a forking server. A cached repo cannot be obtained
		until the server fork()s a worker and the loader thread stops.
		"""

		def __init__(self, ui, maxlen):
		self._ui = ui.copy()
		self._cache = util.lrucachedict(max=maxlen)
		# use deque and Event instead of Queue since deque can discard
		# old items to keep at most maxlen items.
		self._inqueue = collections.deque(maxlen=maxlen)
		self._accepting = False
		self._newentry = threading.Event()
		self._thread = None

		def start(self):
		assert not self._thread
		if self._inqueue.maxlen == 0:
		# no need to spawn loader thread as the cache is disabled
		return
		self._accepting = True
		self._thread = threading.Thread(target=self._mainloop)
		self._thread.start()

		def stop(self):
		if not self._thread:
		return
		self._accepting = False
		self._newentry.set()
		self._thread.join()
		self._thread = None
		self._cache.clear()
		self._inqueue.clear()

		def load(self, path):
		"""Request to load the specified repository in background"""
		self._inqueue.append(path)
		self._newentry.set()

		def get(self, path):
		"""Return a cached repo if available

		This function must be called after fork(), where the loader thread
		is stopped. Otherwise, the returned repo might be updated by the
		loader thread.
		"""
		if self._thread and self._thread.is_alive():
Augie Fackler formatting: blacken the codebase...	r43346	raise error.ProgrammingError(
Martin von Zweigbergk cleanup: join string literals that are already on one line...	r43387	b'cannot obtain cached repo while loader is active'
Augie Fackler formatting: blacken the codebase...	r43346	)
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	return self._cache.peek(path, None)

		def _mainloop(self):
		while self._accepting:
		# Avoid heavy GC after fork(), which would cancel the benefit of
		# COW. We assume that GIL is acquired while GC is underway in the
		# loader thread. If that isn't true, we might have to move
		# gc.collect() to the main thread so that fork() would never stop
		# the thread where GC is in progress.
		gc.collect()

		self._newentry.wait()
		while self._accepting:
		self._newentry.clear()
		try:
		path = self._inqueue.popleft()
		except IndexError:
		break
		scmutil.callcatch(self._ui, lambda: self._load(path))

		def _load(self, path):
		start = util.timer()
		# TODO: repo should be recreated if storage configuration changed
		try:
		# pop before loading so inconsistent state wouldn't be exposed
		repo = self._cache.pop(path)
		except KeyError:
		repo = hg.repository(self._ui, path).unfiltered()
		_warmupcache(repo)
Augie Fackler formatting: blacken the codebase...	r43346	repo.ui.log(
		b'repocache',
		b'loaded repo into cache: %s (in %.3fs)\n',
		path,
		util.timer() - start,
		)
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	self._cache.insert(path, repo)

Augie Fackler formatting: blacken the codebase...	r43346
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	# TODO: think about proper API of preloading cache
		def _warmupcache(repo):
		repo.invalidateall()
		repo.changelog
		repo.obsstore._all
		repo.obsstore.successors
		repo.obsstore.predecessors
		repo.obsstore.children
		for name in obsolete.cachefuncs:
		obsolete.getrevs(repo, name)
		repo._phasecache.loadphaserevs(repo)

Augie Fackler formatting: blacken the codebase...	r43346
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	# TODO: think about proper API of attaching preloaded attributes
		def copycache(srcrepo, destrepo):
		"""Copy cached attributes from srcrepo to destrepo"""
		destfilecache = destrepo._filecache
		srcfilecache = srcrepo._filecache
Augie Fackler formatting: byteify all mercurial/ and hgext/ string literals...	r43347	if b'changelog' in srcfilecache:
		destfilecache[b'changelog'] = ce = srcfilecache[b'changelog']
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	ce.obj.opener = ce.obj._realopener = destrepo.svfs
Augie Fackler formatting: byteify all mercurial/ and hgext/ string literals...	r43347	if b'obsstore' in srcfilecache:
		destfilecache[b'obsstore'] = ce = srcfilecache[b'obsstore']
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	ce.obj.svfs = destrepo.svfs
Augie Fackler formatting: byteify all mercurial/ and hgext/ string literals...	r43347	if b'_phasecache' in srcfilecache:
		destfilecache[b'_phasecache'] = ce = srcfilecache[b'_phasecache']
Yuya Nishihara commandserver: preload repository in master server and reuse its file cache...	r41035	ce.obj.opener = destrepo.svfs