upstream/mercurial-mirror Files · tests/testlib/persistent-nodemap-race-ext.py

transaction: do not rely on a global variable to post_finalize file...

transaction: do not rely on a global variable to post_finalize file We can just add a new argument to the `addfilegenerator` function. This is more explicit and therefor clearer and less error prone. Differential Revision: https://phab.mercurial-scm.org/D12125

marmoute - - Load All Authors

File last commit:

r48852:52018f8e stable


                r49534:21ac6aed

default

Download file

             persistent-nodemap-race-ext.py
        
                    294 lines
            
             | 10.2 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / tests / testlib / persistent-nodemap-race-ext.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        marmoute
    
persistent-nodemap: introduce a test to highlight possible race...

              r48852
            
      """Create the race condition for issue6554

      The persistent nodemap issues had an issue where a second writer could

      overwrite the data that a previous write just wrote. The would break the append

      only garantee of the persistent nodemap and could confuse reader. This

      extensions create all the necessary synchronisation point to the race condition

      to happen.

      It involves 3 process <LEFT> (a writer) <RIGHT> (a writer) and <READER>

      [1] <LEFT> take the lock and start a transaction

      [2] <LEFT> updated `00changelog.i` with the new data

      [3] <RIGHT> reads:

          - the new changelog index `00changelog.i`

          - the old `00changelog.n`

      [4] <LEFT> update the persistent nodemap:

          - writing new data from the last valid offset

          - updating the docket (00changelog.n)

      [5] <LEFT> release the lock

      [6] <RIGHT> grab the lock and run `repo.invalidate`

      [7] <READER> reads:

          - the changelog index after <LEFT> write

          - the nodemap docket after <LEFT> write

      [8] <RIGHT> reload the changelog since `00changelog.n` changed

          /!\ This is the faulty part in issue 6554, the outdated docket is kept

      [9] <RIGHT> write:

          - the changelog index (00changelog.i)

          - the nodemap data (00changelog*.nd)

            /!\ if the outdated docket is used, the write starts from the same ofset

            /!\ as in [4], overwriting data that <LEFT> wrote in step [4].

          - the nodemap docket (00changelog.n)

      [10] <READER> reads the nodemap data from `00changelog*.nd`

           /!\ if step [9] was wrong, the data matching the docket that <READER>

           /!\ loaded have been overwritten and the expected root-nodes is no longer

           /!\ valid.

      """

      from __future__ import print_function

      import os

      from mercurial.revlogutils.constants import KIND_CHANGELOG

      from mercurial import (

          changelog,

          encoding,

          extensions,

          localrepo,

          node,

          pycompat,

          registrar,

          testing,

          util,

      )

      from mercurial.revlogutils import (

          nodemap as nodemaputil,

      )

      configtable = {}

      configitem = registrar.configitem(configtable)

      configitem(b'devel', b'nodemap-race.role', default=None)

      cmdtable = {}

      command = registrar.command(cmdtable)

      LEFT = b'left'

      RIGHT = b'right'

      READER = b'reader'

      SYNC_DIR = os.path.join(encoding.environ[b'TESTTMP'], b'sync-files')

      # mark the end of step [1]

      FILE_LEFT_LOCKED = os.path.join(SYNC_DIR, b'left-locked')

      # mark that step [3] is ready to run.

      FILE_RIGHT_READY_TO_LOCK = os.path.join(SYNC_DIR, b'right-ready-to-lock')

      # mark the end of step [2]

      FILE_LEFT_CL_DATA_WRITE = os.path.join(SYNC_DIR, b'left-data')

      # mark the end of step [4]

      FILE_LEFT_CL_NODEMAP_WRITE = os.path.join(SYNC_DIR, b'left-nodemap')

      # mark the end of step [3]

      FILE_RIGHT_CL_NODEMAP_READ = os.path.join(SYNC_DIR, b'right-nodemap')

      # mark that step [9] is read to run

      FILE_RIGHT_CL_NODEMAP_PRE_WRITE = os.path.join(

          SYNC_DIR, b'right-pre-nodemap-write'

      )

      # mark that step [9] has run.

      FILE_RIGHT_CL_NODEMAP_POST_WRITE = os.path.join(

          SYNC_DIR, b'right-post-nodemap-write'

      )

      # mark that step [7] is ready to run

      FILE_READER_READY = os.path.join(SYNC_DIR, b'reader-ready')

      # mark that step [7] has run

      FILE_READER_READ_DOCKET = os.path.join(SYNC_DIR, b'reader-read-docket')

      def _print(*args, **kwargs):

          print(*args, **kwargs)

      def _role(repo):

          """find the role associated with the process"""

          return repo.ui.config(b'devel', b'nodemap-race.role')

      def wrap_changelog_finalize(orig, cl, tr):

          """wrap the update of `00changelog.i` during transaction finalization

          This is useful for synchronisation before or after the file is updated on disk.

          """

          role = getattr(tr, '_race_role', None)

          if role == RIGHT:

              print('right ready to write, waiting for reader')

              testing.wait_file(FILE_READER_READY)

              testing.write_file(FILE_RIGHT_CL_NODEMAP_PRE_WRITE)

              testing.wait_file(FILE_READER_READ_DOCKET)

              print('right proceeding with writing its changelog index and nodemap')

          ret = orig(cl, tr)

          print("finalized changelog write")

          if role == LEFT:

              testing.write_file(FILE_LEFT_CL_DATA_WRITE)

          return ret

      def wrap_persist_nodemap(orig, tr, revlog, *args, **kwargs):

          """wrap the update of `00changelog.n` and `*.nd` during tr finalization

          This is useful for synchronisation before or after the files are updated on

          disk.

          """

          is_cl = revlog.target[0] == KIND_CHANGELOG

          role = getattr(tr, '_race_role', None)

          if is_cl:

              if role == LEFT:

                  testing.wait_file(FILE_RIGHT_CL_NODEMAP_READ)

          if is_cl:

              print("persisting changelog nodemap")

              print("  new data start at", revlog._nodemap_docket.data_length)

          ret = orig(tr, revlog, *args, **kwargs)

          if is_cl:

              print("persisted changelog nodemap")

              print_nodemap_details(revlog)

              if role == LEFT:

                  testing.write_file(FILE_LEFT_CL_NODEMAP_WRITE)

              elif role == RIGHT:

                  testing.write_file(FILE_RIGHT_CL_NODEMAP_POST_WRITE)

          return ret

      def print_nodemap_details(cl):

          """print relevant information about the nodemap docket currently in memory"""

          dkt = cl._nodemap_docket

          print('docket-details:')

          if dkt is None:

              print('  <no-docket>')

              return

          print('  uid:        ', pycompat.sysstr(dkt.uid))

          print('  actual-tip: ', cl.tiprev())

          print('  tip-rev:    ', dkt.tip_rev)

          print('  data-length:', dkt.data_length)

      def wrap_persisted_data(orig, revlog):

          """print some information about the nodemap information we just read

          Used by the <READER> process only.

          """

          ret = orig(revlog)

          if ret is not None:

              docket, data = ret

              file_path = nodemaputil._rawdata_filepath(revlog, docket)

              file_path = revlog.opener.join(file_path)

              file_size = os.path.getsize(file_path)

              print('record-data-length:', docket.data_length)

              print('actual-data-length:', len(data))

              print('file-actual-length:', file_size)

          return ret

      def sync_read(orig):

          """used by <READER> to force the race window

          This make sure we read the docker from <LEFT> while reading the datafile

          after <RIGHT> write.

          """

          orig()

          testing.write_file(FILE_READER_READ_DOCKET)

          print('reader: nodemap docket read')

          testing.wait_file(FILE_RIGHT_CL_NODEMAP_POST_WRITE)

      def uisetup(ui):

          class RacedRepo(localrepo.localrepository):

              def lock(self, wait=True):

                  # make sure <RIGHT> as the "Wrong" information in memory before

                  # grabbing the lock

                  newlock = self._currentlock(self._lockref) is None

                  if newlock and _role(self) == LEFT:

                      cl = self.unfiltered().changelog

                      print_nodemap_details(cl)

                  elif newlock and _role(self) == RIGHT:

                      testing.write_file(FILE_RIGHT_READY_TO_LOCK)

                      print('nodemap-race: right side start of the locking sequence')

                      testing.wait_file(FILE_LEFT_LOCKED)

                      testing.wait_file(FILE_LEFT_CL_DATA_WRITE)

                      self.invalidate(clearfilecache=True)

                      print('nodemap-race: right side reading changelog')

                      cl = self.unfiltered().changelog

                      tiprev = cl.tiprev()

                      tip = cl.node(tiprev)

                      tiprev2 = cl.rev(tip)

                      if tiprev != tiprev2:

                          raise RuntimeError(

                              'bad tip -round-trip %d %d' % (tiprev, tiprev2)

                          )

                      testing.write_file(FILE_RIGHT_CL_NODEMAP_READ)

                      print('nodemap-race: right side reading of changelog is done')

                      print_nodemap_details(cl)

                      testing.wait_file(FILE_LEFT_CL_NODEMAP_WRITE)

                      print('nodemap-race: right side ready to wait for the lock')

                  ret = super(RacedRepo, self).lock(wait=wait)

                  if newlock and _role(self) == LEFT:

                      print('nodemap-race: left side locked and ready to commit')

                      testing.write_file(FILE_LEFT_LOCKED)

                      testing.wait_file(FILE_RIGHT_READY_TO_LOCK)

                      cl = self.unfiltered().changelog

                      print_nodemap_details(cl)

                  elif newlock and _role(self) == RIGHT:

                      print('nodemap-race: right side locked and ready to commit')

                      cl = self.unfiltered().changelog

                      print_nodemap_details(cl)

                  return ret

              def transaction(self, *args, **kwargs):

                  # duck punch the role on the transaction to help other pieces of code

                  tr = super(RacedRepo, self).transaction(*args, **kwargs)

                  tr._race_role = _role(self)

                  return tr

          localrepo.localrepository = RacedRepo

          extensions.wrapfunction(

              nodemaputil, 'persist_nodemap', wrap_persist_nodemap

          )

          extensions.wrapfunction(

              changelog.changelog, '_finalize', wrap_changelog_finalize

          )

      def reposetup(ui, repo):

          if _role(repo) == READER:

              extensions.wrapfunction(

                  nodemaputil, 'persisted_data', wrap_persisted_data

              )

              extensions.wrapfunction(nodemaputil, 'test_race_hook_1', sync_read)

              class ReaderRepo(repo.__class__):

                  @util.propertycache

                  def changelog(self):

                      print('reader ready to read the changelog, waiting for right')

                      testing.write_file(FILE_READER_READY)

                      testing.wait_file(FILE_RIGHT_CL_NODEMAP_PRE_WRITE)

                      return super(ReaderRepo, self).changelog

              repo.__class__ = ReaderRepo

      @command(b'check-nodemap-race')

      def cmd_check_nodemap_race(ui, repo):

          """Run proper <READER> access in the race Windows and check nodemap content"""

          repo = repo.unfiltered()

          print('reader: reading changelog')

          cl = repo.changelog

          print('reader: changelog read')

          print_nodemap_details(cl)

          tip_rev = cl.tiprev()

          tip_node = cl.node(tip_rev)

          print('tip-rev: ', tip_rev)

          print('tip-node:', node.short(tip_node).decode('ascii'))

          print('node-rev:', cl.rev(tip_node))

          for r in cl.revs():

              n = cl.node(r)

              try:

                  r2 = cl.rev(n)

              except ValueError as exc:

                  print('error while checking revision:', r)

                  print(' ', exc)

                  return 1

              else:

                  if r2 != r:

                      print('revision %d is missing from the nodemap' % r)

                      return 1

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

marmoute persistent-nodemap: introduce a test to highlight possible race...	r48852	"""Create the race condition for issue6554

		The persistent nodemap issues had an issue where a second writer could
		overwrite the data that a previous write just wrote. The would break the append
		only garantee of the persistent nodemap and could confuse reader. This
		extensions create all the necessary synchronisation point to the race condition
		to happen.

		It involves 3 process <LEFT> (a writer) <RIGHT> (a writer) and <READER>

		[1] <LEFT> take the lock and start a transaction
		[2] <LEFT> updated `00changelog.i` with the new data
		[3] <RIGHT> reads:
		- the new changelog index `00changelog.i`
		- the old `00changelog.n`
		[4] <LEFT> update the persistent nodemap:
		- writing new data from the last valid offset
		- updating the docket (00changelog.n)
		[5] <LEFT> release the lock
		[6] <RIGHT> grab the lock and run `repo.invalidate`
		[7] <READER> reads:
		- the changelog index after <LEFT> write
		- the nodemap docket after <LEFT> write
		[8] <RIGHT> reload the changelog since `00changelog.n` changed
		/!\ This is the faulty part in issue 6554, the outdated docket is kept
		[9] <RIGHT> write:
		- the changelog index (00changelog.i)
		- the nodemap data (00changelog*.nd)
		/!\ if the outdated docket is used, the write starts from the same ofset
		/!\ as in [4], overwriting data that <LEFT> wrote in step [4].
		- the nodemap docket (00changelog.n)
		[10] <READER> reads the nodemap data from `00changelog*.nd`
		/!\ if step [9] was wrong, the data matching the docket that <READER>
		/!\ loaded have been overwritten and the expected root-nodes is no longer
		/!\ valid.
		"""

		from __future__ import print_function

		import os

		from mercurial.revlogutils.constants import KIND_CHANGELOG

		from mercurial import (
		changelog,
		encoding,
		extensions,
		localrepo,
		node,
		pycompat,
		registrar,
		testing,
		util,
		)

		from mercurial.revlogutils import (
		nodemap as nodemaputil,
		)

		configtable = {}
		configitem = registrar.configitem(configtable)

		configitem(b'devel', b'nodemap-race.role', default=None)

		cmdtable = {}
		command = registrar.command(cmdtable)

		LEFT = b'left'
		RIGHT = b'right'
		READER = b'reader'

		SYNC_DIR = os.path.join(encoding.environ[b'TESTTMP'], b'sync-files')

		# mark the end of step [1]
		FILE_LEFT_LOCKED = os.path.join(SYNC_DIR, b'left-locked')
		# mark that step [3] is ready to run.
		FILE_RIGHT_READY_TO_LOCK = os.path.join(SYNC_DIR, b'right-ready-to-lock')

		# mark the end of step [2]
		FILE_LEFT_CL_DATA_WRITE = os.path.join(SYNC_DIR, b'left-data')
		# mark the end of step [4]
		FILE_LEFT_CL_NODEMAP_WRITE = os.path.join(SYNC_DIR, b'left-nodemap')
		# mark the end of step [3]
		FILE_RIGHT_CL_NODEMAP_READ = os.path.join(SYNC_DIR, b'right-nodemap')
		# mark that step [9] is read to run
		FILE_RIGHT_CL_NODEMAP_PRE_WRITE = os.path.join(
		SYNC_DIR, b'right-pre-nodemap-write'
		)
		# mark that step [9] has run.
		FILE_RIGHT_CL_NODEMAP_POST_WRITE = os.path.join(
		SYNC_DIR, b'right-post-nodemap-write'
		)
		# mark that step [7] is ready to run
		FILE_READER_READY = os.path.join(SYNC_DIR, b'reader-ready')
		# mark that step [7] has run
		FILE_READER_READ_DOCKET = os.path.join(SYNC_DIR, b'reader-read-docket')


		def _print(args, *kwargs):
		print(args, *kwargs)


		def _role(repo):
		"""find the role associated with the process"""
		return repo.ui.config(b'devel', b'nodemap-race.role')


		def wrap_changelog_finalize(orig, cl, tr):
		"""wrap the update of `00changelog.i` during transaction finalization

		This is useful for synchronisation before or after the file is updated on disk.
		"""
		role = getattr(tr, '_race_role', None)
		if role == RIGHT:
		print('right ready to write, waiting for reader')
		testing.wait_file(FILE_READER_READY)
		testing.write_file(FILE_RIGHT_CL_NODEMAP_PRE_WRITE)
		testing.wait_file(FILE_READER_READ_DOCKET)
		print('right proceeding with writing its changelog index and nodemap')
		ret = orig(cl, tr)
		print("finalized changelog write")
		if role == LEFT:
		testing.write_file(FILE_LEFT_CL_DATA_WRITE)
		return ret


		def wrap_persist_nodemap(orig, tr, revlog, args, *kwargs):
		"""wrap the update of `00changelog.n` and `*.nd` during tr finalization

		This is useful for synchronisation before or after the files are updated on
		disk.
		"""
		is_cl = revlog.target[0] == KIND_CHANGELOG
		role = getattr(tr, '_race_role', None)
		if is_cl:
		if role == LEFT:
		testing.wait_file(FILE_RIGHT_CL_NODEMAP_READ)
		if is_cl:
		print("persisting changelog nodemap")
		print(" new data start at", revlog._nodemap_docket.data_length)
		ret = orig(tr, revlog, args, *kwargs)
		if is_cl:
		print("persisted changelog nodemap")
		print_nodemap_details(revlog)
		if role == LEFT:
		testing.write_file(FILE_LEFT_CL_NODEMAP_WRITE)
		elif role == RIGHT:
		testing.write_file(FILE_RIGHT_CL_NODEMAP_POST_WRITE)
		return ret


		def print_nodemap_details(cl):
		"""print relevant information about the nodemap docket currently in memory"""
		dkt = cl._nodemap_docket
		print('docket-details:')
		if dkt is None:
		print(' <no-docket>')
		return
		print(' uid: ', pycompat.sysstr(dkt.uid))
		print(' actual-tip: ', cl.tiprev())
		print(' tip-rev: ', dkt.tip_rev)
		print(' data-length:', dkt.data_length)


		def wrap_persisted_data(orig, revlog):
		"""print some information about the nodemap information we just read

		Used by the <READER> process only.
		"""
		ret = orig(revlog)
		if ret is not None:
		docket, data = ret
		file_path = nodemaputil._rawdata_filepath(revlog, docket)
		file_path = revlog.opener.join(file_path)
		file_size = os.path.getsize(file_path)
		print('record-data-length:', docket.data_length)
		print('actual-data-length:', len(data))
		print('file-actual-length:', file_size)
		return ret


		def sync_read(orig):
		"""used by <READER> to force the race window

		This make sure we read the docker from <LEFT> while reading the datafile
		after <RIGHT> write.
		"""
		orig()
		testing.write_file(FILE_READER_READ_DOCKET)
		print('reader: nodemap docket read')
		testing.wait_file(FILE_RIGHT_CL_NODEMAP_POST_WRITE)


		def uisetup(ui):
		class RacedRepo(localrepo.localrepository):
		def lock(self, wait=True):
		# make sure <RIGHT> as the "Wrong" information in memory before
		# grabbing the lock
		newlock = self._currentlock(self._lockref) is None
		if newlock and _role(self) == LEFT:
		cl = self.unfiltered().changelog
		print_nodemap_details(cl)
		elif newlock and _role(self) == RIGHT:
		testing.write_file(FILE_RIGHT_READY_TO_LOCK)
		print('nodemap-race: right side start of the locking sequence')
		testing.wait_file(FILE_LEFT_LOCKED)
		testing.wait_file(FILE_LEFT_CL_DATA_WRITE)
		self.invalidate(clearfilecache=True)
		print('nodemap-race: right side reading changelog')
		cl = self.unfiltered().changelog
		tiprev = cl.tiprev()
		tip = cl.node(tiprev)
		tiprev2 = cl.rev(tip)
		if tiprev != tiprev2:
		raise RuntimeError(
		'bad tip -round-trip %d %d' % (tiprev, tiprev2)
		)
		testing.write_file(FILE_RIGHT_CL_NODEMAP_READ)
		print('nodemap-race: right side reading of changelog is done')
		print_nodemap_details(cl)
		testing.wait_file(FILE_LEFT_CL_NODEMAP_WRITE)
		print('nodemap-race: right side ready to wait for the lock')
		ret = super(RacedRepo, self).lock(wait=wait)
		if newlock and _role(self) == LEFT:
		print('nodemap-race: left side locked and ready to commit')
		testing.write_file(FILE_LEFT_LOCKED)
		testing.wait_file(FILE_RIGHT_READY_TO_LOCK)
		cl = self.unfiltered().changelog
		print_nodemap_details(cl)
		elif newlock and _role(self) == RIGHT:
		print('nodemap-race: right side locked and ready to commit')
		cl = self.unfiltered().changelog
		print_nodemap_details(cl)
		return ret

		def transaction(self, args, *kwargs):
		# duck punch the role on the transaction to help other pieces of code
		tr = super(RacedRepo, self).transaction(args, *kwargs)
		tr._race_role = _role(self)
		return tr

		localrepo.localrepository = RacedRepo

		extensions.wrapfunction(
		nodemaputil, 'persist_nodemap', wrap_persist_nodemap
		)
		extensions.wrapfunction(
		changelog.changelog, '_finalize', wrap_changelog_finalize
		)


		def reposetup(ui, repo):
		if _role(repo) == READER:
		extensions.wrapfunction(
		nodemaputil, 'persisted_data', wrap_persisted_data
		)
		extensions.wrapfunction(nodemaputil, 'test_race_hook_1', sync_read)

		class ReaderRepo(repo.__class__):
		@util.propertycache
		def changelog(self):
		print('reader ready to read the changelog, waiting for right')
		testing.write_file(FILE_READER_READY)
		testing.wait_file(FILE_RIGHT_CL_NODEMAP_PRE_WRITE)
		return super(ReaderRepo, self).changelog

		repo.__class__ = ReaderRepo


		@command(b'check-nodemap-race')
		def cmd_check_nodemap_race(ui, repo):
		"""Run proper <READER> access in the race Windows and check nodemap content"""
		repo = repo.unfiltered()
		print('reader: reading changelog')
		cl = repo.changelog
		print('reader: changelog read')
		print_nodemap_details(cl)
		tip_rev = cl.tiprev()
		tip_node = cl.node(tip_rev)
		print('tip-rev: ', tip_rev)
		print('tip-node:', node.short(tip_node).decode('ascii'))
		print('node-rev:', cl.rev(tip_node))
		for r in cl.revs():
		n = cl.node(r)
		try:
		r2 = cl.rev(n)
		except ValueError as exc:
		print('error while checking revision:', r)
		print(' ', exc)
		return 1
		else:
		if r2 != r:
		print('revision %d is missing from the nodemap' % r)
		return 1