"""Create the race condition for issue6554 The persistent nodemap issues had an issue where a second writer could overwrite the data that a previous write just wrote. The would break the append only garantee of the persistent nodemap and could confuse reader. This extensions create all the necessary synchronisation point to the race condition to happen. It involves 3 process (a writer) (a writer) and [1] take the lock and start a transaction [2] updated `00changelog.i` with the new data [3] reads: - the new changelog index `00changelog.i` - the old `00changelog.n` [4] update the persistent nodemap: - writing new data from the last valid offset - updating the docket (00changelog.n) [5] release the lock [6] grab the lock and run `repo.invalidate` [7] reads: - the changelog index after write - the nodemap docket after write [8] reload the changelog since `00changelog.n` changed /!\ This is the faulty part in issue 6554, the outdated docket is kept [9] write: - the changelog index (00changelog.i) - the nodemap data (00changelog*.nd) /!\ if the outdated docket is used, the write starts from the same ofset /!\ as in [4], overwriting data that wrote in step [4]. - the nodemap docket (00changelog.n) [10] reads the nodemap data from `00changelog*.nd` /!\ if step [9] was wrong, the data matching the docket that /!\ loaded have been overwritten and the expected root-nodes is no longer /!\ valid. """ import os from mercurial.revlogutils.constants import KIND_CHANGELOG from mercurial import ( changelog, encoding, extensions, localrepo, node, pycompat, registrar, testing, util, ) from mercurial.revlogutils import ( nodemap as nodemaputil, ) configtable = {} configitem = registrar.configitem(configtable) configitem(b'devel', b'nodemap-race.role', default=None) cmdtable = {} command = registrar.command(cmdtable) LEFT = b'left' RIGHT = b'right' READER = b'reader' SYNC_DIR = os.path.join(encoding.environ[b'TESTTMP'], b'sync-files') # mark the end of step [1] FILE_LEFT_LOCKED = os.path.join(SYNC_DIR, b'left-locked') # mark that step [3] is ready to run. FILE_RIGHT_READY_TO_LOCK = os.path.join(SYNC_DIR, b'right-ready-to-lock') # mark the end of step [2] FILE_LEFT_CL_DATA_WRITE = os.path.join(SYNC_DIR, b'left-data') # mark the end of step [4] FILE_LEFT_CL_NODEMAP_WRITE = os.path.join(SYNC_DIR, b'left-nodemap') # mark the end of step [3] FILE_RIGHT_CL_NODEMAP_READ = os.path.join(SYNC_DIR, b'right-nodemap') # mark that step [9] is read to run FILE_RIGHT_CL_NODEMAP_PRE_WRITE = os.path.join( SYNC_DIR, b'right-pre-nodemap-write' ) # mark that step [9] has run. FILE_RIGHT_CL_NODEMAP_POST_WRITE = os.path.join( SYNC_DIR, b'right-post-nodemap-write' ) # mark that step [7] is ready to run FILE_READER_READY = os.path.join(SYNC_DIR, b'reader-ready') # mark that step [7] has run FILE_READER_READ_DOCKET = os.path.join(SYNC_DIR, b'reader-read-docket') def _print(*args, **kwargs): print(*args, **kwargs) def _role(repo): """find the role associated with the process""" return repo.ui.config(b'devel', b'nodemap-race.role') def wrap_changelog_finalize(orig, cl, tr): """wrap the update of `00changelog.i` during transaction finalization This is useful for synchronisation before or after the file is updated on disk. """ role = getattr(tr, '_race_role', None) if role == RIGHT: print('right ready to write, waiting for reader') testing.wait_file(FILE_READER_READY) testing.write_file(FILE_RIGHT_CL_NODEMAP_PRE_WRITE) testing.wait_file(FILE_READER_READ_DOCKET) print('right proceeding with writing its changelog index and nodemap') ret = orig(cl, tr) print("finalized changelog write") if role == LEFT: testing.write_file(FILE_LEFT_CL_DATA_WRITE) return ret def wrap_persist_nodemap(orig, tr, revlog, *args, **kwargs): """wrap the update of `00changelog.n` and `*.nd` during tr finalization This is useful for synchronisation before or after the files are updated on disk. """ is_cl = revlog.target[0] == KIND_CHANGELOG role = getattr(tr, '_race_role', None) if is_cl: if role == LEFT: testing.wait_file(FILE_RIGHT_CL_NODEMAP_READ) if is_cl: print("persisting changelog nodemap") print(" new data start at", revlog._nodemap_docket.data_length) ret = orig(tr, revlog, *args, **kwargs) if is_cl: print("persisted changelog nodemap") print_nodemap_details(revlog) if role == LEFT: testing.write_file(FILE_LEFT_CL_NODEMAP_WRITE) elif role == RIGHT: testing.write_file(FILE_RIGHT_CL_NODEMAP_POST_WRITE) return ret def print_nodemap_details(cl): """print relevant information about the nodemap docket currently in memory""" dkt = cl._nodemap_docket print('docket-details:') if dkt is None: print(' ') return print(' uid: ', pycompat.sysstr(dkt.uid)) print(' actual-tip: ', cl.tiprev()) print(' tip-rev: ', dkt.tip_rev) print(' data-length:', dkt.data_length) def wrap_persisted_data(orig, revlog): """print some information about the nodemap information we just read Used by the process only. """ ret = orig(revlog) if ret is not None: docket, data = ret file_path = nodemaputil._rawdata_filepath(revlog, docket) file_path = revlog.opener.join(file_path) file_size = os.path.getsize(file_path) print('record-data-length:', docket.data_length) print('actual-data-length:', len(data)) print('file-actual-length:', file_size) return ret def sync_read(orig): """used by to force the race window This make sure we read the docker from while reading the datafile after write. """ orig() testing.write_file(FILE_READER_READ_DOCKET) print('reader: nodemap docket read') testing.wait_file(FILE_RIGHT_CL_NODEMAP_POST_WRITE) def uisetup(ui): class RacedRepo(localrepo.localrepository): def lock(self, wait=True): # make sure as the "Wrong" information in memory before # grabbing the lock newlock = self._currentlock(self._lockref) is None if newlock and _role(self) == LEFT: cl = self.unfiltered().changelog print_nodemap_details(cl) elif newlock and _role(self) == RIGHT: testing.write_file(FILE_RIGHT_READY_TO_LOCK) print('nodemap-race: right side start of the locking sequence') testing.wait_file(FILE_LEFT_LOCKED) testing.wait_file(FILE_LEFT_CL_DATA_WRITE) self.invalidate(clearfilecache=True) print('nodemap-race: right side reading changelog') cl = self.unfiltered().changelog tiprev = cl.tiprev() tip = cl.node(tiprev) tiprev2 = cl.rev(tip) if tiprev != tiprev2: raise RuntimeError( 'bad tip -round-trip %d %d' % (tiprev, tiprev2) ) testing.write_file(FILE_RIGHT_CL_NODEMAP_READ) print('nodemap-race: right side reading of changelog is done') print_nodemap_details(cl) testing.wait_file(FILE_LEFT_CL_NODEMAP_WRITE) print('nodemap-race: right side ready to wait for the lock') ret = super(RacedRepo, self).lock(wait=wait) if newlock and _role(self) == LEFT: print('nodemap-race: left side locked and ready to commit') testing.write_file(FILE_LEFT_LOCKED) testing.wait_file(FILE_RIGHT_READY_TO_LOCK) cl = self.unfiltered().changelog print_nodemap_details(cl) elif newlock and _role(self) == RIGHT: print('nodemap-race: right side locked and ready to commit') cl = self.unfiltered().changelog print_nodemap_details(cl) return ret def transaction(self, *args, **kwargs): # duck punch the role on the transaction to help other pieces of code tr = super(RacedRepo, self).transaction(*args, **kwargs) tr._race_role = _role(self) return tr localrepo.localrepository = RacedRepo extensions.wrapfunction( nodemaputil, 'persist_nodemap', wrap_persist_nodemap ) extensions.wrapfunction( changelog.changelog, '_finalize', wrap_changelog_finalize ) def reposetup(ui, repo): if _role(repo) == READER: extensions.wrapfunction( nodemaputil, 'persisted_data', wrap_persisted_data ) extensions.wrapfunction(nodemaputil, 'test_race_hook_1', sync_read) class ReaderRepo(repo.__class__): @util.propertycache def changelog(self): print('reader ready to read the changelog, waiting for right') testing.write_file(FILE_READER_READY) testing.wait_file(FILE_RIGHT_CL_NODEMAP_PRE_WRITE) return super(ReaderRepo, self).changelog repo.__class__ = ReaderRepo @command(b'check-nodemap-race') def cmd_check_nodemap_race(ui, repo): """Run proper access in the race Windows and check nodemap content""" repo = repo.unfiltered() print('reader: reading changelog') cl = repo.changelog print('reader: changelog read') print_nodemap_details(cl) tip_rev = cl.tiprev() tip_node = cl.node(tip_rev) print('tip-rev: ', tip_rev) print('tip-node:', node.short(tip_node).decode('ascii')) print('node-rev:', cl.rev(tip_node)) for r in cl.revs(): n = cl.node(r) try: r2 = cl.rev(n) except ValueError as exc: print('error while checking revision:', r) print(' ', exc) return 1 else: if r2 != r: print('revision %d is missing from the nodemap' % r) return 1