upstream/mercurial-mirror Files · mercurial/revlogutils/sidedata.py

sidedatacopies: read rename information from sidedata...

sidedatacopies: read rename information from sidedata Repository using the new format now use changeset centric algorithm and read the copies information from the changelog sidedata. Differential Revision: https://phab.mercurial-scm.org/D6953

marmoute - - Load All Authors

File last commit:

r43412:beed7ce6 default


                r43416:0171483b

default

Download file

             sidedata.py
        
                    106 lines
            
             | 3.2 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / revlogutils / sidedata.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        marmoute
    
sidedata: add a new module with basic documentation...

              r43301
            
      # sidedata.py - Logic around store extra data alongside revlog revisions

      #

      # Copyright 2019 Pierre-Yves David <pierre-yves.david@octobus.net>

      #

      # This software may be used and distributed according to the terms of the

      # GNU General Public License version 2 or any later version.

      """core code for "sidedata" support

      The "sidedata" are stored alongside the revision without actually being part of

      its content and not affecting its hash. Its main use case is to cache

      important information related to a changeset.

      The current implementation is experimental and subject to changes. Do not rely

      on it in production.

      Sidedata are stored in the revlog itself, within the revision rawtext. They

      are inserted and removed using the flagprocessors mechanism. The following

      format is currently used::

          initial header:

              <number of sidedata; 2 bytes>

          sidedata index (repeated N times):

              <sidedata-key; 2 bytes>

              <sidedata-entry-length: 4 bytes>

              <sidedata-content-sha1-digest: 20 bytes>

          sidedata content (repeated N times, same order as the index):

              <sidedata-content; X bytes>

          normal raw text:

              <all bytes remaining in the rawtext>

      This is a simple and effective format. It should be enough to experiment with

      the concept.

      """

      from __future__ import absolute_import

        marmoute
    
sidedata: add a function to read sidedata from revlog raw text...

              r43302
            
      import hashlib

      import struct

      from .. import error

        marmoute
    
sidedata: test we can successfully write sidedata...

              r43308
            
      ## sidedata type constants
      #
      # Each constant is the integer key identifying one kind of sidedata entry.
      # The values are written into the stored rawtext, so they are spelled out
      # as explicit literals.

      # Keys 1 to 7 are a block reserved for testing purposes.

      SD_TEST1 = 1

      SD_TEST2 = 2

      SD_TEST3 = 3

      SD_TEST4 = 4

      SD_TEST5 = 5

      SD_TEST6 = 6

      SD_TEST7 = 7

        marmoute
    
sidedatacopies: write copies information in sidedata when applicable...

              r43412
            
      # Keys under which copy-related information is stored.
      # NOTE(review): judging by the names only, these hold the copies relative
      # to each parent and the lists of added/removed files -- confirm against
      # the code that writes them.

      SD_P1COPIES = 8

      SD_P2COPIES = 9

      SD_FILESADDED = 10

      SD_FILESREMOVED = 11

        marmoute
    
sidedata: test we can successfully write sidedata...

              r43308
            
      # internal format constant

        marmoute
    
sidedata: adjust string for python3...

              r43318
            
      # Leading header: the number of sidedata entries, stored as one big-endian
      # unsigned 16-bit integer (2 bytes).
      SIDEDATA_HEADER = struct.Struct(r'>H')

      # One index record per sidedata entry, big-endian and unpadded (26 bytes):
      # key (unsigned 16-bit), content length (unsigned 32-bit), and the 20-byte
      # SHA-1 digest of the content.
      SIDEDATA_ENTRY = struct.Struct(r'>HL20s')

        marmoute
    
sidedata: add a function to read sidedata from revlog raw text...

              r43302
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: add a function to write sidedata into a raw text...

              r43303
            
      def sidedatawriteprocessor(rl, text, sidedata):
          """Serialize ``sidedata`` in front of ``text`` to build the rawtext.

          The result is laid out as: the entry count, then one fixed-size index
          record (key, content length, SHA-1 digest of the content) per entry in
          sorted order, then every content blob in that same order, and finally
          the bytes of ``text``.

          ``rl`` is not used.  ``sidedata`` is a mapping from integer key to the
          bytes stored under that key.

          Returns a ``(rawtext, False)`` tuple.
          NOTE(review): the constant ``False`` is presumably the "validate hash"
          flag of the flag processor protocol -- confirm against the caller.
          """
          entries = sorted(sidedata.items())
          chunks = [SIDEDATA_HEADER.pack(len(entries))]
          # index records come first, all of them, before any content
          chunks.extend(
              SIDEDATA_ENTRY.pack(key, len(value), hashlib.sha1(value).digest())
              for key, value in entries
          )
          # then the contents, in the same order as their index records
          chunks.extend(value for _key, value in entries)
          chunks.append(bytes(text))
          return b''.join(chunks), False

        marmoute
    
sidedata: add a function to write sidedata into a raw text...

              r43303
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: add a function to read sidedata from revlog raw text...

              r43302
            
      def sidedatareadprocessor(rl, text):
          """Split a stored rawtext into the revision text and its sidedata.

          ``text`` starts with the entry count, followed by one index record per
          entry (key, content length, SHA-1 digest), followed by the contents in
          index order; whatever remains after the last content is the revision
          text.  ``rl`` is not used.

          Returns a ``(text, True, sidedata)`` tuple where ``sidedata`` maps each
          key to its content.

          Raises ``error.SidedataHashError`` when the digest computed over a
          content does not match the digest stored in its index record.
          """
          headersize = SIDEDATA_HEADER.size
          entrysize = SIDEDATA_ENTRY.size
          (count,) = SIDEDATA_HEADER.unpack(text[:headersize])
          # contents start right after the last index record
          payloadstart = headersize + entrysize * count
          entries = {}
          for idx in range(count):
              entrystart = headersize + idx * entrysize
              record = text[entrystart : entrystart + entrysize]
              key, length, expected = SIDEDATA_ENTRY.unpack(record)
              # fetch and verify the content described by this record
              payloadend = payloadstart + length
              payload = text[payloadstart:payloadend]
              actual = hashlib.sha1(payload).digest()
              if actual != expected:
                  raise error.SidedataHashError(key, expected, actual)
              entries[key] = payload
              payloadstart = payloadend
          return text[payloadstart:], True, entries

        marmoute
    
sidedata: add a function for _processflagsraw usage...

              r43304
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: add a function for _processflagsraw usage...

              r43304
            
      def sidedatarawprocessor(rl, text):
          """Raw-mode processor for revisions carrying sidedata.

          Sidedata modifies the rawtext, which prevents rawtext hash validation,
          so this always returns False without looking at ``rl`` or ``text``.
          """
          return False

        marmoute
    
sidedata: register the flag processors if the repository allows for it...

              r43305
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: register the flag processors if the repository allows for it...

              r43305
            
      # The three sidedata processors bundled in (read, write, raw) order.
      # NOTE(review): presumably handed as-is to the revlog flag processor
      # registration, which would rely on this ordering -- confirm against the
      # caller before reordering.
      processors = (

          sidedatareadprocessor,

          sidedatawriteprocessor,

          sidedatarawprocessor,

      )

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

marmoute sidedata: add a new module with basic documentation...	r43301	# sidedata.py - Logic around store extra data alongside revlog revisions
		#
		# Copyright 2019 Pierre-Yves David <pierre-yves.david@octobus.net>
		#
		# This software may be used and distributed according to the terms of the
		# GNU General Public License version 2 or any later version.
		"""core code for "sidedata" support

		The "sidedata" are stored alongside the revision without actually being part of
		its content and not affecting its hash. Its main use case is to cache
		important information related to a changeset.

		The current implementation is experimental and subject to changes. Do not rely
		on it in production.

		Sidedata are stored in the revlog itself, within the revision rawtext. They
		are inserted and removed using the flagprocessors mechanism. The following
		format is currently used::

		initial header:
		<number of sidedata; 2 bytes>
		sidedata index (repeated N times):
		<sidedata-key; 2 bytes>
		<sidedata-entry-length: 4 bytes>
		<sidedata-content-sha1-digest: 20 bytes>
		sidedata content (repeated N times, same order as the index):
		<sidedata-content; X bytes>
		normal raw text:
		<all bytes remaining in the rawtext>

		This is a simple and effective format. It should be enough to experiment with
		the concept.
		"""

		from __future__ import absolute_import
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302
		import hashlib
		import struct

		from .. import error

marmoute sidedata: test we can successfully write sidedata...	r43308	## sidedata type constant
		# reserve a block for testing purposes.
		SD_TEST1 = 1
		SD_TEST2 = 2
		SD_TEST3 = 3
		SD_TEST4 = 4
		SD_TEST5 = 5
		SD_TEST6 = 6
		SD_TEST7 = 7

marmoute sidedatacopies: write copies information in sidedata when applicable...	r43412	# key to store copies related information
		SD_P1COPIES = 8
		SD_P2COPIES = 9
		SD_FILESADDED = 10
		SD_FILESREMOVED = 11

marmoute sidedata: test we can successfully write sidedata...	r43308	# internal format constant
marmoute sidedata: adjust string for python3...	r43318	SIDEDATA_HEADER = struct.Struct(r'>H')
		SIDEDATA_ENTRY = struct.Struct(r'>HL20s')
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: add a function to write sidedata into a raw text...	r43303	def sidedatawriteprocessor(rl, text, sidedata):
		sidedata = list(sidedata.items())
		sidedata.sort()
		rawtext = [SIDEDATA_HEADER.pack(len(sidedata))]
		for key, value in sidedata:
		digest = hashlib.sha1(value).digest()
		rawtext.append(SIDEDATA_ENTRY.pack(key, len(value), digest))
		for key, value in sidedata:
		rawtext.append(value)
		rawtext.append(bytes(text))
Augie Fackler formatting: byteify all mercurial/ and hgext/ string literals...	r43347	return b''.join(rawtext), False
marmoute sidedata: add a function to write sidedata into a raw text...	r43303
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302	def sidedatareadprocessor(rl, text):
		sidedata = {}
		offset = 0
Augie Fackler formatting: blacken the codebase...	r43346	(nbentry,) = SIDEDATA_HEADER.unpack(text[: SIDEDATA_HEADER.size])
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302	offset += SIDEDATA_HEADER.size
		dataoffset = SIDEDATA_HEADER.size + (SIDEDATA_ENTRY.size * nbentry)
		for i in range(nbentry):
		nextoffset = offset + SIDEDATA_ENTRY.size
		key, size, storeddigest = SIDEDATA_ENTRY.unpack(text[offset:nextoffset])
		offset = nextoffset
		# read the data associated with that entry
		nextdataoffset = dataoffset + size
		entrytext = text[dataoffset:nextdataoffset]
		readdigest = hashlib.sha1(entrytext).digest()
		if storeddigest != readdigest:
		raise error.SidedataHashError(key, storeddigest, readdigest)
		sidedata[key] = entrytext
		dataoffset = nextdataoffset
		text = text[dataoffset:]
		return text, True, sidedata
marmoute sidedata: add a function for _processflagsraw usage...	r43304
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: add a function for _processflagsraw usage...	r43304	def sidedatarawprocessor(rl, text):
		# side data modifies rawtext and prevents rawtext hash validation
		return False
marmoute sidedata: register the flag processors if the repository allows for it...	r43305
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: register the flag processors if the repository allows for it...	r43305	processors = (
		sidedatareadprocessor,
		sidedatawriteprocessor,
		sidedatarawprocessor,
		)