upstream/mercurial-mirror Commit - r12041:270fb4d3

1

# changegroup.py - Mercurial changegroup manipulation functions

1

# changegroup.py - Mercurial changegroup manipulation functions

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from i18n import _

8

from i18n import _

9

import util

9

import util

10

import struct, os, bz2, zlib, tempfile

10

import struct, os, bz2, zlib, tempfile

11

12

def getchunk(source):

12

def getchunk(source):

13

"""return the next chunk from changegroup 'source' as a string"""

13

"""return the next chunk from changegroup 'source' as a string"""

14

d = source.read(4)

14

d = source.read(4)

15

if not d:

15

if not d:

16

return ""

16

return ""

17

l = struct.unpack(">l", d)[0]

17

l = struct.unpack(">l", d)[0]

18

if l <= 4:

18

if l <= 4:

19

return ""

19

return ""

20

d = source.read(l - 4)

20

d = source.read(l - 4)

21

if len(d) < l - 4:

21

if len(d) < l - 4:

22

raise util.Abort(_("premature EOF reading chunk"

22

raise util.Abort(_("premature EOF reading chunk"

23

" (got %d bytes, expected %d)")

23

" (got %d bytes, expected %d)")

24

% (len(d), l - 4))

24

% (len(d), l - 4))

25

return d

25

return d

26

27

def chunkiter(source, progress=None):

27

def chunkiter(source, progress=None):

28

"""iterate through the chunks in source, yielding a sequence of chunks

28

"""iterate through the chunks in source, yielding a sequence of chunks

29

(strings)"""

29

(strings)"""

30

while 1:

30

while 1:

31

c = getchunk(source)

31

c = getchunk(source)

32

if not c:

32

if not c:

33

break

33

break

34

elif progress is not None:

34

elif progress is not None:

35

progress()

35

progress()

36

yield c

36

yield c

37

38

def chunkheader(length):

38

def chunkheader(length):

39

"""return a changegroup chunk header (string)"""

39

"""return a changegroup chunk header (string)"""

40

return struct.pack(">l", length + 4)

40

return struct.pack(">l", length + 4)

41

42

def closechunk():

42

def closechunk():

43

"""return a changegroup chunk header (string) for a zero-length chunk"""

43

"""return a changegroup chunk header (string) for a zero-length chunk"""

44

return struct.pack(">l", 0)

44

return struct.pack(">l", 0)

45

46

class nocompress(object):

46

class nocompress(object):

47

def compress(self, x):

47

def compress(self, x):

48

return x

48

return x

49

def flush(self):

49

def flush(self):

50

return ""

50

return ""

51

52

bundletypes = {

52

bundletypes = {

53

"": ("", nocompress),

53

"": ("", nocompress),

54

"HG10UN": ("HG10UN", nocompress),

54

"HG10UN": ("HG10UN", nocompress),

55

"HG10BZ": ("HG10", lambda: bz2.BZ2Compressor()),

55

"HG10BZ": ("HG10", lambda: bz2.BZ2Compressor()),

56

"HG10GZ": ("HG10GZ", lambda: zlib.compressobj()),

56

"HG10GZ": ("HG10GZ", lambda: zlib.compressobj()),

57

}

57

}

58

59

def collector(cl, mmfs, files):

59

def collector(cl, mmfs, files):

60

# Gather information about changeset nodes going out in a bundle.

60

# Gather information about changeset nodes going out in a bundle.

61

# We want to gather manifests needed and filelogs affected.

61

# We want to gather manifests needed and filelogs affected.

62

def collect(node):

62

def collect(node):

63

c = cl.read(node)

63

c = cl.read(node)

64

files.update(c[3])

64

files.update(c[3])

65

mmfs.setdefault(c[0], node)

65

mmfs.setdefault(c[0], node)

66

return collect

66

return collect

67

68

# hgweb uses this list to communicate its preferred type

68

# hgweb uses this list to communicate its preferred type

69

bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

69

bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']

70

71

def writebundle(cg, filename, bundletype):

71

def writebundle(cg, filename, bundletype):

72

"""Write a bundle file and return its filename.

72

"""Write a bundle file and return its filename.

73

74

Existing files will not be overwritten.

74

Existing files will not be overwritten.

75

If no filename is specified, a temporary file is created.

75

If no filename is specified, a temporary file is created.

76

bz2 compression can be turned off.

76

bz2 compression can be turned off.

77

The bundle file will be deleted in case of errors.

77

The bundle file will be deleted in case of errors.

78

"""

78

"""

79

80

fh = None

80

fh = None

81

cleanup = None

81

cleanup = None

82

try:

82

try:

83

if filename:

83

if filename:

84

fh = open(filename, "wb")

84

fh = open(filename, "wb")

85

else:

85

else:

86

fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")

86

fd, filename = tempfile.mkstemp(prefix="hg-bundle-", suffix=".hg")

87

fh = os.fdopen(fd, "wb")

87

fh = os.fdopen(fd, "wb")

88

cleanup = filename

88

cleanup = filename

89

90

header, compressor = bundletypes[bundletype]

90

header, compressor = bundletypes[bundletype]

91

fh.write(header)

91

fh.write(header)

92

z = compressor()

92

z = compressor()

93

94

# parse the changegroup data, otherwise we will block

94

# parse the changegroup data, otherwise we will block

95

# in case of sshrepo because we don't know the end of the stream

95

# in case of sshrepo because we don't know the end of the stream

96

97

# an empty chunkiter is the end of the changegroup

97

# an empty chunkiter is the end of the changegroup

98

# a changegroup has at least 2 chunkiters (changelog and manifest).

98

# a changegroup has at least 2 chunkiters (changelog and manifest).

99

# after that, an empty chunkiter is the end of the changegroup

99

# after that, an empty chunkiter is the end of the changegroup

100

empty = False

100

empty = False

101

count = 0

101

count = 0

102

while not empty or count <= 2:

102

while not empty or count <= 2:

103

empty = True

103

empty = True

104

count += 1

104

count += 1

105

for chunk in chunkiter(cg):

105

for chunk in chunkiter(cg):

106

empty = False

106

empty = False

107

fh.write(z.compress(chunkheader(len(chunk))))

107

fh.write(z.compress(chunkheader(len(chunk))))

108

pos = 0

108

pos = 0

109

while pos < len(chunk):

109

while pos < len(chunk):

110

next = pos + 2**20

110

next = pos + 2**20

111

fh.write(z.compress(chunk[pos:next]))

111

fh.write(z.compress(chunk[pos:next]))

112

pos = next

112

pos = next

113

fh.write(z.compress(closechunk()))

113

fh.write(z.compress(closechunk()))

114

fh.write(z.flush())

114

fh.write(z.flush())

115

cleanup = None

115

cleanup = None

116

return filename

116

return filename

117

finally:

117

finally:

118

if fh is not None:

118

if fh is not None:

119

fh.close()

119

fh.close()

120

if cleanup is not None:

120

if cleanup is not None:

121

os.unlink(cleanup)

121

os.unlink(cleanup)

122

123

def unbundle(header, fh):

123

def decompressor(fh, alg):

124

if ~~header~~ == '~~HG10~~UN':

124

if alg == 'UN':

125

return fh

125

return fh

126

elif not header.startswith('HG'):

126

elif alg == 'GZ':

127

# old client with uncompressed bundle

128

def generator(f):

129

yield header

130

for chunk in f:

131

yield chunk

132

elif header == 'HG10GZ':

133

def generator(f):

127

def generator(f):

134

zd = zlib.decompressobj()

128

zd = zlib.decompressobj()

135

for chunk in f:

129

for chunk in f:

136

yield zd.decompress(chunk)

130

yield zd.decompress(chunk)

137

elif ~~header~~ == '~~HG10~~BZ':

131

elif alg == 'BZ':

138

def generator(f):

132

def generator(f):

139

zd = bz2.BZ2Decompressor()

133

zd = bz2.BZ2Decompressor()

140

zd.decompress("BZ")

134

zd.decompress("BZ")

141

for chunk in util.filechunkiter(f, 4096):

135

for chunk in util.filechunkiter(f, 4096):

142

yield zd.decompress(chunk)

136

yield zd.decompress(chunk)

143

return util.chunkbuffer(generator(fh))

137

else:

138

raise util.Abort("unknown bundle compression '%s'" % alg)

139

return generator(fh)

140

141

def unbundle(header, fh):
    """Return a util.chunkbuffer over the decompressed contents of 'fh'.

    'header' is the data already read from the front of the stream.  When
    it does not start with 'HG' the stream is treated as a headerless,
    uncompressed bundle: the bytes already consumed are pushed back in
    front of the remaining data and the stream is handled as "HG10UN".
    Otherwise characters 4-5 of the header select the compression
    algorithm handed to decompressor().
    """
    if not header.startswith('HG'):
        def fixup(f, h):
            # re-emit the bytes that were consumed while sniffing the header
            yield h
            for x in f:
                yield x
        # was fixup(f, h): neither name exists in this scope (NameError)
        fh = fixup(fh, header)
        header = "HG10UN"

    alg = header[4:6]
    return util.chunkbuffer(decompressor(fh, alg))

144

152

145

def readbundle(fh, fname):

153

def readbundle(fh, fname):

146

header = fh.read(6)

154

header = fh.read(6)

147

if not header.startswith('HG'):

155

if not header.startswith('HG'):

148

raise util.Abort(_('%s: not a Mercurial bundle file') % fname)

156

raise util.Abort(_('%s: not a Mercurial bundle file') % fname)

149

if not header.startswith('HG10'):

157

if not header.startswith('HG10'):

150

raise util.Abort(_('%s: unknown bundle version') % fname)

158

raise util.Abort(_('%s: unknown bundle version') % fname)

151

elif header not in bundletypes:

159

elif header not in bundletypes:

152

raise util.Abort(_('%s: unknown bundle compression type') % fname)

160

raise util.Abort(_('%s: unknown bundle compression type') % fname)

153

return unbundle(header, fh)

161

return unbundle(header, fh)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # changegroup.py - Mercurial changegroup manipulation functions
             #
             #  Copyright 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from i18n import _
             import util
             import struct, os, bz2, zlib, tempfile
             def getchunk(source):
                 """Read one length-prefixed chunk from changegroup 'source'.

                 The 4-byte big-endian length counts the prefix itself.  Returns the
                 payload, or "" when nothing could be read or the length is <= 4.
                 Raises util.Abort when the payload is shorter than announced.
                 """
                 prefix = source.read(4)
                 if not prefix:
                     return ""
                 (total,) = struct.unpack(">l", prefix)
                 if total <= 4:
                     return ""
                 wanted = total - 4
                 payload = source.read(wanted)
                 received = len(payload)
                 if received < wanted:
                     raise util.Abort(_("premature EOF reading chunk"
                                        " (got %d bytes, expected %d)")
                                      % (received, wanted))
                 return payload
             def chunkiter(source, progress=None):
                 """Yield successive chunks (strings) read from 'source'.

                 Stops at the first empty chunk.  If 'progress' is given it is
                 called with no arguments before each chunk is yielded.
                 """
                 while True:
                     piece = getchunk(source)
                     if not piece:
                         return
                     if progress is not None:
                         progress()
                     yield piece
             def chunkheader(length):
                 """Build the header (string) for a chunk carrying 'length' payload bytes.

                 The encoded value is length + 4, i.e. it includes the 4-byte
                 header itself.
                 """
                 framed = length + 4
                 return struct.pack(">l", framed)
             def closechunk():
                 """Build the header (string) of a zero-length chunk: a packed 0."""
                 terminator = struct.pack(">l", 0)
                 return terminator
             class nocompress(object):
                 """Pass-through object offering the compress()/flush() pair."""

                 def flush(self):
                     """Nothing is ever buffered, so there is nothing left to emit."""
                     return ""

                 def compress(self, x):
                     """Hand 'x' back unchanged."""
                     return x
             # Maps a bundle type name to a pair: (header string written at the
             # start of the bundle file, zero-argument factory returning an object
             # with compress() and flush() methods).
             bundletypes = {
                 "": ("", nocompress),
                 "HG10UN": ("HG10UN", nocompress),
                 # NOTE(review): only "HG10" is written for bz2, presumably because
                 # the compressed stream itself begins with "BZ" and so completes
                 # the six-byte "HG10BZ" header -- confirm against the bz2 format.
                 "HG10BZ": ("HG10", lambda: bz2.BZ2Compressor()),
                 "HG10GZ": ("HG10GZ", lambda: zlib.compressobj()),
             }
             def collector(cl, mmfs, files):
                 """Return a callback that records what a changeset node brings along.

                 For each node passed to the callback, the entry returned by
                 cl.read(node) is inspected: item 3 (the affected files) is merged
                 into 'files', and item 0 (the manifest) is mapped to the node in
                 'mmfs' unless that manifest is already present there.
                 """
                 def collect(node):
                     entry = cl.read(node)
                     touched = entry[3]
                     files.update(touched)
                     manifest = entry[0]
                     mmfs.setdefault(manifest, node)
                 return collect
             # hgweb uses this list to communicate its preferred type
             bundlepriority = ['HG10GZ', 'HG10BZ', 'HG10UN']
             def writebundle(cg, filename, bundletype):
                 """Write the changegroup stream 'cg' to a bundle file; return its name.

                 If 'filename' is empty a temporary file is created with
                 tempfile.mkstemp; otherwise 'filename' is opened in "wb" mode.
                 'bundletype' is a key of bundletypes and selects the header and
                 the compressor.
                 If anything fails after the file has been opened, the file is
                 removed again before the error propagates.
                 """
                 out = None
                 doomed = None  # path to unlink in the finally clause on failure
                 try:
                     if not filename:
                         handle, filename = tempfile.mkstemp(prefix="hg-bundle-",
                                                             suffix=".hg")
                         out = os.fdopen(handle, "wb")
                     else:
                         out = open(filename, "wb")
                     doomed = filename

                     magic, makecompressor = bundletypes[bundletype]
                     out.write(magic)
                     packer = makecompressor()

                     # The changegroup has to be parsed while copying: for an
                     # sshrepo the end of the stream is otherwise unknown and the
                     # read would block.
                     #
                     # A changegroup holds at least two chunk groups (changelog
                     # and manifest); once those are past, a group with no chunks
                     # marks the end of the changegroup.
                     slab = 2**20  # feed the compressor at most this much at once
                     groups = 0
                     sawdata = True
                     while sawdata or groups <= 2:
                         sawdata = False
                         groups += 1
                         for chunk in chunkiter(cg):
                             sawdata = True
                             size = len(chunk)
                             out.write(packer.compress(chunkheader(size)))
                             for start in range(0, size, slab):
                                 out.write(packer.compress(chunk[start:start + slab]))
                         out.write(packer.compress(closechunk()))
                     out.write(packer.flush())

                     # success: keep the file
                     doomed = None
                     return filename
                 finally:
                     if out is not None:
                         out.close()
                     if doomed is not None:
                         os.unlink(doomed)
-            def unbundle(header, fh):
+            def decompressor(fh, alg):
-                if header == 'HG10UN':
+                if alg == 'UN':
                     return fh
-                elif not header.startswith('HG'):
+                elif alg == 'GZ':
-                    # old client with uncompressed bundle
-                    def generator(f):
-                        yield header
-                        for chunk in f:
-                            yield chunk
-                elif header == 'HG10GZ':
                     def generator(f):
                         zd = zlib.decompressobj()
                         for chunk in f:
                             yield zd.decompress(chunk)
-                elif header == 'HG10BZ':
+                elif alg == 'BZ':
                     def generator(f):
                         zd = bz2.BZ2Decompressor()
                         zd.decompress("BZ")
                         for chunk in util.filechunkiter(f, 4096):
                             yield zd.decompress(chunk)
-                return util.chunkbuffer(generator(fh))
+                else:
+                    raise util.Abort("unknown bundle compression '%s'" % alg)
+                return generator(fh)
+            def unbundle(header, fh):
+                """Return a util.chunkbuffer over the decompressed contents of 'fh'.
+
+                'header' is the data already read from the front of the stream.
+                When it does not start with 'HG' the stream is treated as a
+                headerless, uncompressed bundle: the bytes already consumed are
+                pushed back in front of the remaining data and the stream is
+                handled as "HG10UN".  Otherwise characters 4-5 of the header
+                select the compression algorithm handed to decompressor().
+                """
+                if not header.startswith('HG'):
+                    def fixup(f, h):
+                        # re-emit the bytes consumed while sniffing the header
+                        yield h
+                        for x in f:
+                            yield x
+                    # was fixup(f, h): neither name exists here (NameError)
+                    fh = fixup(fh, header)
+                    header = "HG10UN"
+                alg = header[4:6]
+                return util.chunkbuffer(decompressor(fh, alg))
             def readbundle(fh, fname):
                 """Validate the 6-byte header of bundle 'fh' and start unbundling it.

                 'fname' is only used in error messages.  Raises util.Abort when
                 the header does not start with 'HG', does not start with 'HG10',
                 or is not a key of bundletypes; otherwise returns the result of
                 unbundle(header, fh).
                 """
                 magic = fh.read(6)
                 if magic.startswith('HG10'):
                     if magic in bundletypes:
                         return unbundle(magic, fh)
                     complaint = _('%s: unknown bundle compression type')
                 elif magic.startswith('HG'):
                     complaint = _('%s: unknown bundle version')
                 else:
                     complaint = _('%s: not a Mercurial bundle file')
                 raise util.Abort(complaint % fname)