upstream/mercurial-mirror Files · mercurial/changegroup.py

chunkiter: handle large reads more efficiently...

chunkiter: handle large reads more efficiently: (1) for large reads, don't attempt to read more than necessary; (2) if we've gathered the exact number of bytes needed, avoid a string copy.

Matt Mackall - - Load All Authors

File last commit:

r5368:61462e7d default


                r5449:17a4b20e

default

Download file

             changegroup.py
        
                    122 lines
            
             | 3.5 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / changegroup.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      """

      changegroup.py - Mercurial changegroup manipulation functions

       Copyright 2006 Matt Mackall <mpm@selenic.com>

      This software may be used and distributed according to the terms

      of the GNU General Public License, incorporated herein by reference.

      """

      from i18n import _

      import struct, os, bz2, zlib, util, tempfile

      def getchunk(source):
          """Read one chunk from a changegroup stream and return its payload.

          A chunk starts with a 4-byte big-endian signed length that counts
          its own four bytes, followed by the payload.  An empty string is
          returned when the stream is exhausted and for any length of four
          or less, which is how the zero length written by closechunk()
          reads back.

          Raises util.Abort if the stream ends inside the length header or
          before the whole payload has been read.
          """
          header = source.read(4)
          if not header:
              return ""
          if len(header) < 4:
              # a partial header would otherwise surface as a raw
              # struct.error from unpack() below
              raise util.Abort(_("premature EOF reading chunk header"
                                 " (got %d bytes, expected %d)")
                                % (len(header), 4))
          length = struct.unpack(">l", header)[0]
          if length <= 4:
              return ""
          payload = source.read(length - 4)
          if len(payload) < length - 4:
              raise util.Abort(_("premature EOF reading chunk"
                                 " (got %d bytes, expected %d)")
                                % (len(payload), length - 4))
          return payload

      def chunkiter(source):
          """Yield successive chunks read from source.

          Each item is whatever getchunk(source) returns; iteration stops at
          the first empty result.
          """
          chunk = getchunk(source)
          while chunk:
              yield chunk
              chunk = getchunk(source)

      def chunkheader(length):
          """Return the packed header for a chunk carrying length payload bytes.

          The stored value is length + 4, i.e. it also counts the four header
          bytes, packed as a big-endian signed 32-bit integer.
          """
          total = length + 4
          return struct.pack(">l", total)

      def closechunk():
          """Return the marker that closes a run of chunks: a packed zero length."""
          terminator = struct.pack(">l", 0)
          return terminator

      class nocompress(object):
          """Pass-through object exposing the compress()/flush() method pair.

          It is used in bundletypes where no compression is wanted, so that
          callers can treat every entry the same way.
          """

          def compress(self, x):
              """Return x exactly as given."""
              return x

          def flush(self):
              """Return an empty string; no data is ever held back."""
              return ""

      # Maps a bundle type name to a pair: the header string written at the
      # start of the file, and a zero-argument callable returning an object
      # with compress() and flush() methods.
      bundletypes = {
          "": ("", nocompress),
          "HG10UN": ("HG10UN", nocompress),
          # Only "HG10" is written for bz2 bundles.  readbundle matches the
          # six bytes "HG10BZ" and then feeds "BZ" to its decompressor, so the
          # trailing "BZ" is presumably the first two bytes of the compressed
          # stream itself.
          "HG10BZ": ("HG10", bz2.BZ2Compressor),
          "HG10GZ": ("HG10GZ", zlib.compressobj),
      }

      def writebundle(cg, filename, bundletype):
          """Write the changegroup read from cg to a bundle file; return its name.

          When filename is given it is opened with mode "wb"; otherwise a
          temporary file (prefix "hg-bundle-", suffix ".hg") is created and
          its path is used.  bundletype is a key of bundletypes and selects
          both the header written first and the compressor applied to
          everything after it.

          If an error occurs once the file has been opened, the file is
          closed and deleted before the exception propagates.
          """
          out = None
          # path to remove if we do not reach the end successfully
          pending = None
          try:
              if not filename:
                  handle, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
                  out = os.fdopen(handle, "wb")
              else:
                  out = open(filename, "wb")
              pending = filename

              magic, factory = bundletypes[bundletype]
              out.write(magic)
              comp = factory()

              # The changegroup has to be parsed rather than copied blindly:
              # with an sshrepo the end of the stream is unknown and a plain
              # read would block.  A chunk group that yields no chunks marks
              # the end of the changegroup.
              step = 2**20
              while True:
                  seen = 0
                  for chunk in chunkiter(cg):
                      seen += 1
                      out.write(comp.compress(chunkheader(len(chunk))))
                      # feed the compressor at most `step` bytes at a time
                      for start in range(0, len(chunk), step):
                          out.write(comp.compress(chunk[start:start + step]))
                  out.write(comp.compress(closechunk()))
                  if not seen:
                      break

              out.write(comp.flush())
              pending = None
              return filename
          finally:
              if out is not None:
                  out.close()
              if pending is not None:
                  os.unlink(pending)

      def readbundle(fh, fname):
          """Return an object from which the bundle's changegroup can be read.

          The first six bytes of fh identify the bundle format; fname is only
          used in error messages.

          - "HG10UN": fh itself is returned, positioned after the header.
          - "HG10BZ": a util.chunkbuffer over the bz2-decompressed data.
          - "HG10GZ": a util.chunkbuffer over the zlib-decompressed data, so
            that bundles written with the "HG10GZ" entry of bundletypes can
            be read back.

          Raises util.Abort if the header does not start with "HG", names a
          version other than "HG10", or names an unknown compression type.
          """
          header = fh.read(6)
          if not header.startswith("HG"):
              raise util.Abort(_("%s: not a Mercurial bundle file") % fname)
          elif not header.startswith("HG10"):
              raise util.Abort(_("%s: unknown bundle version") % fname)

          if header == "HG10UN":
              return fh
          elif header == "HG10BZ":
              def generator(f):
                  zd = bz2.BZ2Decompressor()
                  # the "BZ" just consumed as part of the header is fed back
                  # to the decompressor before the rest of the file
                  zd.decompress("BZ")
                  for chunk in util.filechunkiter(f, 4096):
                      yield zd.decompress(chunk)
              return util.chunkbuffer(generator(fh))
          elif header == "HG10GZ":
              def generator(f):
                  zd = zlib.decompressobj()
                  for chunk in util.filechunkiter(f, 4096):
                      yield zd.decompress(chunk)
                  # hand over anything the decompressor still holds
                  tail = zd.flush()
                  if tail:
                      yield tail
              return util.chunkbuffer(generator(fh))

          raise util.Abort(_("%s: unknown bundle compression type")
                           % fname)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				"""
				changegroup.py - Mercurial changegroup manipulation functions

				Copyright 2006 Matt Mackall <mpm@selenic.com>

				This software may be used and distributed according to the terms
				of the GNU General Public License, incorporated herein by reference.
				"""

				from i18n import _
				import struct, os, bz2, zlib, util, tempfile

				def getchunk(source):
				    """Read one chunk from a changegroup stream and return its payload.

				    A chunk starts with a 4-byte big-endian signed length that counts
				    its own four bytes, followed by the payload.  An empty string is
				    returned when the stream is exhausted and for any length of four
				    or less, which is how the zero length written by closechunk()
				    reads back.

				    Raises util.Abort if the stream ends inside the length header or
				    before the whole payload has been read.
				    """
				    header = source.read(4)
				    if not header:
				        return ""
				    if len(header) < 4:
				        # a partial header would otherwise surface as a raw
				        # struct.error from unpack() below
				        raise util.Abort(_("premature EOF reading chunk header"
				                           " (got %d bytes, expected %d)")
				                          % (len(header), 4))
				    length = struct.unpack(">l", header)[0]
				    if length <= 4:
				        return ""
				    payload = source.read(length - 4)
				    if len(payload) < length - 4:
				        raise util.Abort(_("premature EOF reading chunk"
				                           " (got %d bytes, expected %d)")
				                          % (len(payload), length - 4))
				    return payload

				def chunkiter(source):
				    """Yield successive chunks read from source.

				    Each item is whatever getchunk(source) returns; iteration stops at
				    the first empty result.
				    """
				    chunk = getchunk(source)
				    while chunk:
				        yield chunk
				        chunk = getchunk(source)

				def chunkheader(length):
				    """Return the packed header for a chunk carrying length payload bytes.

				    The stored value is length + 4, i.e. it also counts the four header
				    bytes, packed as a big-endian signed 32-bit integer.
				    """
				    total = length + 4
				    return struct.pack(">l", total)

				def closechunk():
				    """Return the marker that closes a run of chunks: a packed zero length."""
				    terminator = struct.pack(">l", 0)
				    return terminator

				class nocompress(object):
				    """Pass-through object exposing the compress()/flush() method pair.

				    It is used in bundletypes where no compression is wanted, so that
				    callers can treat every entry the same way.
				    """

				    def compress(self, x):
				        """Return x exactly as given."""
				        return x

				    def flush(self):
				        """Return an empty string; no data is ever held back."""
				        return ""

				# Maps a bundle type name to a pair: the header string written at the
				# start of the file, and a zero-argument callable returning an object
				# with compress() and flush() methods.
				bundletypes = {
				    "": ("", nocompress),
				    "HG10UN": ("HG10UN", nocompress),
				    # Only "HG10" is written for bz2 bundles.  readbundle matches the
				    # six bytes "HG10BZ" and then feeds "BZ" to its decompressor, so the
				    # trailing "BZ" is presumably the first two bytes of the compressed
				    # stream itself.
				    "HG10BZ": ("HG10", bz2.BZ2Compressor),
				    "HG10GZ": ("HG10GZ", zlib.compressobj),
				}

				def writebundle(cg, filename, bundletype):
				    """Write the changegroup read from cg to a bundle file; return its name.

				    When filename is given it is opened with mode "wb"; otherwise a
				    temporary file (prefix "hg-bundle-", suffix ".hg") is created and
				    its path is used.  bundletype is a key of bundletypes and selects
				    both the header written first and the compressor applied to
				    everything after it.

				    If an error occurs once the file has been opened, the file is
				    closed and deleted before the exception propagates.
				    """
				    out = None
				    # path to remove if we do not reach the end successfully
				    pending = None
				    try:
				        if not filename:
				            handle, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")
				            out = os.fdopen(handle, "wb")
				        else:
				            out = open(filename, "wb")
				        pending = filename

				        magic, factory = bundletypes[bundletype]
				        out.write(magic)
				        comp = factory()

				        # The changegroup has to be parsed rather than copied blindly:
				        # with an sshrepo the end of the stream is unknown and a plain
				        # read would block.  A chunk group that yields no chunks marks
				        # the end of the changegroup.
				        step = 2**20
				        while True:
				            seen = 0
				            for chunk in chunkiter(cg):
				                seen += 1
				                out.write(comp.compress(chunkheader(len(chunk))))
				                # feed the compressor at most `step` bytes at a time
				                for start in range(0, len(chunk), step):
				                    out.write(comp.compress(chunk[start:start + step]))
				            out.write(comp.compress(closechunk()))
				            if not seen:
				                break

				        out.write(comp.flush())
				        pending = None
				        return filename
				    finally:
				        if out is not None:
				            out.close()
				        if pending is not None:
				            os.unlink(pending)

				def readbundle(fh, fname):
				    """Return an object from which the bundle's changegroup can be read.

				    The first six bytes of fh identify the bundle format; fname is only
				    used in error messages.

				    - "HG10UN": fh itself is returned, positioned after the header.
				    - "HG10BZ": a util.chunkbuffer over the bz2-decompressed data.
				    - "HG10GZ": a util.chunkbuffer over the zlib-decompressed data, so
				      that bundles written with the "HG10GZ" entry of bundletypes can
				      be read back.

				    Raises util.Abort if the header does not start with "HG", names a
				    version other than "HG10", or names an unknown compression type.
				    """
				    header = fh.read(6)
				    if not header.startswith("HG"):
				        raise util.Abort(_("%s: not a Mercurial bundle file") % fname)
				    elif not header.startswith("HG10"):
				        raise util.Abort(_("%s: unknown bundle version") % fname)

				    if header == "HG10UN":
				        return fh
				    elif header == "HG10BZ":
				        def generator(f):
				            zd = bz2.BZ2Decompressor()
				            # the "BZ" just consumed as part of the header is fed back
				            # to the decompressor before the rest of the file
				            zd.decompress("BZ")
				            for chunk in util.filechunkiter(f, 4096):
				                yield zd.decompress(chunk)
				        return util.chunkbuffer(generator(fh))
				    elif header == "HG10GZ":
				        def generator(f):
				            zd = zlib.decompressobj()
				            for chunk in util.filechunkiter(f, 4096):
				                yield zd.decompress(chunk)
				            # hand over anything the decompressor still holds
				            tail = zd.flush()
				            if tail:
				                yield tail
				        return util.chunkbuffer(generator(fh))

				    raise util.Abort(_("%s: unknown bundle compression type")
				                     % fname)