upstream/mercurial-mirror Files · mercurial/revlogutils/sidedata.py

mail: add type hints for pytype...

mail: add type hints for pytype We essentially annotate functions in which handling of bytes/str is not obvious in order to hopefully clear things out. See also changeset introducing typing hints in Mercurial. Most types are straightforward but a few is wrong, and we need to either disable pytype on respective instructions or use wrong annotations. These will be fixed in next changesets. Notice the type Union[bytes, str] of "s" parameter of headencode(), this reflects how email.header.Header.append() behaves.

Augie Fackler - - Load All Authors

File last commit:

r43812:2fe6121c default


                r44024:8d9e2c2b

default

Download file

             sidedata.py
        
                    106 lines
            
             | 3.2 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / revlogutils / sidedata.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        marmoute
    
sidedata: add a new module with basic documentation...

              r43301
            
      # sidedata.py - Logic around store extra data alongside revlog revisions

      #

      # Copyright 2019 Pierre-Yves David <pierre-yves.david@octobus.net>

      #

      # This software may be used and distributed according to the terms of the

      # GNU General Public License version 2 or any later version.

      """core code for "sidedata" support

      The "sidedata" are stored alongside the revision without actually being part of

      its content and without affecting its hash. Its main use case is to cache

      important information related to a changeset.

      The current implementation is experimental and subject to changes. Do not rely

      on it in production.

      Sidedata are stored in the revlog itself, within the revision rawtext. They

      are inserted into and removed from it using the flagprocessors mechanism. The following

      format is currently used::

          initial header:

              <number of sidedata; 2 bytes>

          sidedata entry headers (repeated N times):

              <sidedata-key; 2 bytes>

              <sidedata-entry-length: 4 bytes>

              <sidedata-content-sha1-digest: 20 bytes>

          sidedata contents (repeated N times, in entry-header order):

              <sidedata-content; X bytes>

          normal raw text:

              <all bytes remaining in the rawtext>

      This is a simple and effective format. It should be enough to experiment with

      the concept.

      """

      from __future__ import absolute_import

        marmoute
    
sidedata: add a function to read sidedata from revlog raw text...

              r43302
            
      import hashlib

      import struct

      from .. import error

        marmoute
    
sidedata: test we can successfully write sidedata...

              r43308
            
      ## sidedata type constants

      # Values 1 through 7 are reserved as a block for testing purposes.

      SD_TEST1 = 1

      SD_TEST2 = 2

      SD_TEST3 = 3

      SD_TEST4 = 4

      SD_TEST5 = 5

      SD_TEST6 = 6

      SD_TEST7 = 7

        marmoute
    
sidedatacopies: write copies information in sidedata when applicable...

              r43412
            
      # keys used to store copy-related information

      SD_P1COPIES = 8

      SD_P2COPIES = 9

      SD_FILESADDED = 10

      SD_FILESREMOVED = 11

        marmoute
    
sidedata: test we can successfully write sidedata...

              r43308
            
      # internal format constant

        Augie Fackler
    
cleanup: remove pointless r-prefixes on single-quoted strings...

              r43906
            
      # Leading header of the sidedata block: the number of sidedata entries,
      # packed as a big-endian unsigned 16-bit integer.
      SIDEDATA_HEADER = struct.Struct('>H')

      # Fixed-size header describing one entry, big-endian: the entry key
      # (unsigned 16-bit), the content length (unsigned 32-bit) and the
      # 20-byte sha1 digest of the content.
      SIDEDATA_ENTRY = struct.Struct('>HL20s')

        marmoute
    
sidedata: add a function to read sidedata from revlog raw text...

              r43302
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: add a function to write sidedata into a raw text...

              r43303
            
      def sidedatawriteprocessor(rl, text, sidedata):
          """Serialize ``sidedata`` and prepend it to ``text``.

          The produced rawtext is laid out as follows: the number of entries,
          then one fixed-size entry header (key, content length, sha1 digest of
          the content) per item, then every content in the same order, and
          finally ``text`` itself. Items are emitted in sorted order.

          ``rl`` is accepted but not used here.

          Returns a ``(rawtext, False)`` tuple.
          """
          entries = sorted(sidedata.items())
          chunks = [SIDEDATA_HEADER.pack(len(entries))]
          # all the entry headers come first...
          chunks.extend(
              SIDEDATA_ENTRY.pack(key, len(value), hashlib.sha1(value).digest())
              for key, value in entries
          )
          # ... followed by all the contents, in matching order
          chunks.extend(value for _key, value in entries)
          chunks.append(bytes(text))
          return b''.join(chunks), False

        marmoute
    
sidedata: add a function to write sidedata into a raw text...

              r43303
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: add a function to read sidedata from revlog raw text...

              r43302
            
      def sidedatareadprocessor(rl, text):
          """Split the sidedata stored at the start of ``text`` from the rest.

          The entry count is read first, then each fixed-size entry header (key,
          content length, stored sha1 digest). The matching content is sliced
          out of the area following the entry headers and its sha1 digest is
          compared with the stored one.

          ``rl`` is accepted but not used here.

          Returns a ``(text, True, sidedata)`` tuple where ``text`` is what
          remains after the last content and ``sidedata`` maps each key to its
          content.

          Raises ``error.SidedataHashError`` when a content does not match its
          stored digest.
          """
          headersize = SIDEDATA_HEADER.size
          entrysize = SIDEDATA_ENTRY.size
          (count,) = SIDEDATA_HEADER.unpack(text[:headersize])
          # contents start right after the table of fixed-size entry headers
          datastart = headersize + entrysize * count
          entries = {}
          for index in range(count):
              entrystart = headersize + entrysize * index
              rawentry = text[entrystart : entrystart + entrysize]
              key, length, expected = SIDEDATA_ENTRY.unpack(rawentry)
              # read the content associated with that entry and verify it
              dataend = datastart + length
              content = text[datastart:dataend]
              actual = hashlib.sha1(content).digest()
              if actual != expected:
                  raise error.SidedataHashError(key, expected, actual)
              entries[key] = content
              datastart = dataend
          return text[datastart:], True, entries

        marmoute
    
sidedata: add a function for _processflagsraw usage...

              r43304
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: add a function for _processflagsraw usage...

              r43304
            
      def sidedatarawprocessor(rl, text):
          """Raw-access processor for sidedata; always returns ``False``.

          Side data modifies the rawtext and so prevents rawtext hash
          validation. Neither ``rl`` nor ``text`` is inspected.
          """
          return False

        marmoute
    
sidedata: register the flag processors if the repository allows for it...

              r43305
            
        Augie Fackler
    
formatting: blacken the codebase...

              r43346
            
        marmoute
    
sidedata: register the flag processors if the repository allows for it...

              r43305
            
      # The sidedata read, write and raw processors, grouped in that order.
      # NOTE(review): presumably consumed when registering the sidedata flag
      # processors on a revlog -- confirm against the caller.
      processors = (

          sidedatareadprocessor,

          sidedatawriteprocessor,

          sidedatarawprocessor,

      )

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

marmoute sidedata: add a new module with basic documentation...	r43301	# sidedata.py - Logic around store extra data alongside revlog revisions
		#
		# Copyright 2019 Pierre-Yves David <pierre-yves.david@octobus.net>
		#
		# This software may be used and distributed according to the terms of the
		# GNU General Public License version 2 or any later version.
		"""core code for "sidedata" support

		The "sidedata" are stored alongside the revision without actually being part of
		its content and without affecting its hash. Its main use case is to cache
		important information related to a changeset.

		The current implementation is experimental and subject to changes. Do not rely
		on it in production.

		Sidedata are stored in the revlog itself, within the revision rawtext. They
		are inserted into and removed from it using the flagprocessors mechanism. The following
		format is currently used::

		initial header:
		<number of sidedata; 2 bytes>
		sidedata entry headers (repeated N times):
		<sidedata-key; 2 bytes>
		<sidedata-entry-length: 4 bytes>
		<sidedata-content-sha1-digest: 20 bytes>
		sidedata contents (repeated N times, in entry-header order):
		<sidedata-content; X bytes>
		normal raw text:
		<all bytes remaining in the rawtext>

		This is a simple and effective format. It should be enough to experiment with
		the concept.
		"""

		from __future__ import absolute_import
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302
		import hashlib
		import struct

		from .. import error

marmoute sidedata: test we can successfully write sidedata...	r43308	## sidedata type constant
		# reserve a block for testing purposes.
		SD_TEST1 = 1
		SD_TEST2 = 2
		SD_TEST3 = 3
		SD_TEST4 = 4
		SD_TEST5 = 5
		SD_TEST6 = 6
		SD_TEST7 = 7

marmoute sidedatacopies: write copies information in sidedata when applicable...	r43412	# key to store copies related information
		SD_P1COPIES = 8
		SD_P2COPIES = 9
		SD_FILESADDED = 10
		SD_FILESREMOVED = 11

marmoute sidedata: test we can successfully write sidedata...	r43308	# internal format constant
Augie Fackler cleanup: remove pointless r-prefixes on single-quoted strings...	r43906	SIDEDATA_HEADER = struct.Struct('>H')
		SIDEDATA_ENTRY = struct.Struct('>HL20s')
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: add a function to write sidedata into a raw text...	r43303	def sidedatawriteprocessor(rl, text, sidedata):
		sidedata = list(sidedata.items())
		sidedata.sort()
		rawtext = [SIDEDATA_HEADER.pack(len(sidedata))]
		for key, value in sidedata:
		digest = hashlib.sha1(value).digest()
		rawtext.append(SIDEDATA_ENTRY.pack(key, len(value), digest))
		for key, value in sidedata:
		rawtext.append(value)
		rawtext.append(bytes(text))
Augie Fackler formatting: byteify all mercurial/ and hgext/ string literals...	r43347	return b''.join(rawtext), False
marmoute sidedata: add a function to write sidedata into a raw text...	r43303
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302	def sidedatareadprocessor(rl, text):
		sidedata = {}
		offset = 0
Augie Fackler formatting: blacken the codebase...	r43346	(nbentry,) = SIDEDATA_HEADER.unpack(text[: SIDEDATA_HEADER.size])
marmoute sidedata: add a function to read sidedata from revlog raw text...	r43302	offset += SIDEDATA_HEADER.size
		dataoffset = SIDEDATA_HEADER.size + (SIDEDATA_ENTRY.size * nbentry)
		for i in range(nbentry):
		nextoffset = offset + SIDEDATA_ENTRY.size
		key, size, storeddigest = SIDEDATA_ENTRY.unpack(text[offset:nextoffset])
		offset = nextoffset
		# read the data associated with that entry
		nextdataoffset = dataoffset + size
		entrytext = text[dataoffset:nextdataoffset]
		readdigest = hashlib.sha1(entrytext).digest()
		if storeddigest != readdigest:
		raise error.SidedataHashError(key, storeddigest, readdigest)
		sidedata[key] = entrytext
		dataoffset = nextdataoffset
		text = text[dataoffset:]
		return text, True, sidedata
marmoute sidedata: add a function for _processflagsraw usage...	r43304
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: add a function for _processflagsraw usage...	r43304	def sidedatarawprocessor(rl, text):
		# side data modifies rawtext and prevent rawtext hash validation
		return False
marmoute sidedata: register the flag processors if the repository allows for it...	r43305
Augie Fackler formatting: blacken the codebase...	r43346
marmoute sidedata: register the flag processors if the repository allows for it...	r43305	processors = (
		sidedatareadprocessor,
		sidedatawriteprocessor,
		sidedatarawprocessor,
		)