upstream/mercurial-mirror Commit - r31652:d5cbbee5

1

2

3

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

'''largefiles utility code: must not import other modules in this package.'''

9

'''largefiles utility code: must not import other modules in this package.'''

10

from __future__ import absolute_import

10

from __future__ import absolute_import

11

12

import copy

12

import copy

13

import hashlib

13

import hashlib

14

import os

14

import os

15

import platform

15

import platform

16

import stat

16

import stat

17

18

from mercurial.i18n import _

18

from mercurial.i18n import _

19

20

from mercurial import (

20

from mercurial import (

21

dirstate,

21

dirstate,

22

encoding,

22

encoding,

23

error,

23

error,

24

httpconnection,

24

httpconnection,

25

match as matchmod,

25

match as matchmod,

26

node,

26

node,

27

pycompat,

27

pycompat,

28

scmutil,

28

scmutil,

29

util,

29

util,

30

vfs as vfsmod,

30

vfs as vfsmod,

31

)

31

)

32

33

# Name of the directory used for standin files (see getstandinmatcher()).
shortname = '.hglf'
# Prefix that standin() puts in front of a largefile's slash-separated path.
shortnameslash = shortname + '/'
# Name used for the config section, the store directory and the user cache.
longname = 'largefiles'

36

37

# -- Private worker functions ------------------------------------------

37

# -- Private worker functions ------------------------------------------

38

39

def getminsize(ui, assumelfiles, opt, default=10):
    '''Return the minimum largefile size.

    A truthy ``opt`` is used as is. Otherwise, when ``assumelfiles`` is
    true, the ``minsize`` setting of the largefiles config section is
    read, with ``default`` as fallback. A truthy result is converted to
    a float.

    Raises error.Abort if the value cannot be converted to a float or if
    the resulting size is None.
    '''
    size = opt
    if assumelfiles and not size:
        size = ui.config(longname, 'minsize', default=default)
    if size:
        try:
            size = float(size)
        except ValueError:
            raise error.Abort(_('largefiles: size must be number (not %s)\n')
                              % size)
    if size is None:
        raise error.Abort(_('minimum size for largefiles must be specified'))
    return size

52

53

def link(src, dest):
    """Hardlink src to dest, falling back to an atomic copy on OSError.

    The parent directory of dest is created first. When the copy
    fallback is taken, the permission bits of src are applied to dest.
    """
    util.makedirs(os.path.dirname(dest))
    try:
        util.oslink(src, dest)
    except OSError:
        # hardlinking failed: stream the content through an atomic temp file
        with open(src, 'rb') as infile, util.atomictempfile(dest) as outfile:
            for block in util.filechunkiter(infile):
                outfile.write(block)
        srcmode = os.stat(src).st_mode
        os.chmod(dest, srcmode)

65

66

def usercachepath(ui, hash):
    '''Return the path of the file with the given hash inside the
    "global" largefiles cache.

    That cache lets repositories share largefiles, which saves both
    download bandwidth and storage space.'''
    cachedir = _usercachedir(ui)
    return os.path.join(cachedir, hash)

72

73

def _usercachedir(ui):
    '''Return the directory of the "global" largefiles cache.

    A configured ``usercache`` path wins. Otherwise the location is
    derived from per-platform environment variables. Raises error.Abort
    when the operating system is not recognized or when none of the
    expected environment variables is set.
    '''
    configured = ui.configpath(longname, 'usercache', None)
    if configured:
        return configured

    env = encoding.environ
    if pycompat.osname == 'nt':
        # prefer LOCALAPPDATA, fall back to APPDATA
        appdata = env.get('LOCALAPPDATA', env.get('APPDATA'))
        if appdata:
            return os.path.join(appdata, longname)
    elif platform.system() == 'Darwin':
        home = env.get('HOME')
        if home:
            return os.path.join(home, 'Library', 'Caches', longname)
    elif pycompat.osname == 'posix':
        xdgcache = env.get('XDG_CACHE_HOME')
        if xdgcache:
            return os.path.join(xdgcache, longname)
        home = env.get('HOME')
        if home:
            return os.path.join(home, '.cache', longname)
    else:
        raise error.Abort(_('unknown operating system: %s\n')
                          % pycompat.osname)

    # known platform, but no usable environment variable was set
    raise error.Abort(_('unknown %s usercache location') % longname)

98

99

def inusercache(ui, hash):
    '''Return true if a file for the given hash exists in the user cache.'''
    return os.path.exists(usercachepath(ui, hash))

102

103

def findfile(repo, hash):
    '''Return the store path of the largefile with the given hash.

    If the file is only present in the user cache, it is linked into
    the store first. Return None when it is in neither place.'''
    storedpath, found = findstorepath(repo, hash)
    if found:
        repo.ui.note(_('found %s in store\n') % hash)
        return storedpath

    if not inusercache(repo.ui, hash):
        return None

    repo.ui.note(_('found %s in system cache\n') % hash)
    target = storepath(repo, hash)
    link(usercachepath(repo.ui, hash), target)
    return target

117

118

class largefilesdirstate(dirstate.dirstate):
    '''dirstate subclass that passes every path through unixpath()
    before delegating to the base class, and never ignores a file.'''

    def __getitem__(self, key):
        normalized = unixpath(key)
        return super(largefilesdirstate, self).__getitem__(normalized)

    def normal(self, f):
        normalized = unixpath(f)
        return super(largefilesdirstate, self).normal(normalized)

    def remove(self, f):
        normalized = unixpath(f)
        return super(largefilesdirstate, self).remove(normalized)

    def add(self, f):
        normalized = unixpath(f)
        return super(largefilesdirstate, self).add(normalized)

    def drop(self, f):
        normalized = unixpath(f)
        return super(largefilesdirstate, self).drop(normalized)

    def forget(self, f):
        normalized = unixpath(f)
        return super(largefilesdirstate, self).forget(normalized)

    def normallookup(self, f):
        normalized = unixpath(f)
        return super(largefilesdirstate, self).normallookup(normalized)

    def _ignore(self, f):
        # nothing is ever ignored in the largefiles dirstate
        return False

    def write(self, tr=False):
        # ``tr`` is deliberately not forwarded; None is always passed to:
        # (1) disable PENDING mode always
        #     (lfdirstate isn't yet managed as a part of the transaction)
        # (2) avoid develwarn 'use dirstate.write with ....'
        super(largefilesdirstate, self).write(None)

140

141

def openlfdirstate(ui, repo, create=True):
    '''
    Return a dirstate object that tracks largefiles: i.e. its root is
    the repo root, but it is saved in .hg/largefiles/dirstate.

    With ``create`` true and no dirstate file present yet, the new
    object is populated from the standins found in repo.dirstate.
    '''
    vfs = repo.vfs
    storedir = longname
    lfopener = vfsmod.vfs(vfs.join(storedir))
    lfdirstate = largefilesdirstate(lfopener, ui, repo.root,
                                    repo.dirstate._validate)

    # If the largefiles dirstate does not exist, populate and create
    # it. This ensures that we create it on the first meaningful
    # largefiles operation in a new clone.
    dirstatefile = vfs.join(storedir, 'dirstate')
    if create and not vfs.exists(dirstatefile):
        standinmatcher = getstandinmatcher(repo)
        found = repo.dirstate.walk(standinmatcher, [], False, False)

        if len(found) > 0:
            vfs.makedirs(storedir)

        for standinpath in found:
            lfdirstate.normallookup(splitstandin(standinpath))
    return lfdirstate

166

167

def lfdirstatestatus(lfdirstate, repo):
    '''Return the status of lfdirstate with every "unsure" file resolved.

    Each unsure largefile is compared, by hash, with the standin
    recorded in the parent of the working directory. It is appended to
    the modified list when the standin is missing or the hashes differ;
    otherwise it is appended to the clean list and marked normal in
    lfdirstate.
    '''
    parentctx = repo['.']
    matchall = matchmod.always(repo.root, repo.getcwd())
    unsure, status = lfdirstate.status(matchall, [], False, False, False)
    modified = status.modified
    clean = status.clean
    for lfile in unsure:
        try:
            fctx = parentctx[standin(lfile)]
        except LookupError:
            fctx = None
        unchanged = (fctx and
                     fctx.data().strip() == hashfile(repo.wjoin(lfile)))
        if unchanged:
            clean.append(lfile)
            lfdirstate.normal(lfile)
        else:
            modified.append(lfile)
    return status

183

184

def listlfiles(repo, rev=None, matcher=None):
    '''Return the list of largefiles in the working copy (rev is None)
    or in the specified changeset.'''

    if matcher is None:
        matcher = getstandinmatcher(repo)

    workingcopy = rev is None
    lfiles = []
    for f in repo[rev].walk(matcher):
        # ignore unknown files in working directory
        if workingcopy and repo.dirstate[f] == '?':
            continue
        lfiles.append(splitstandin(f))
    return lfiles

195

196

def instore(repo, hash, forcelocal=False):
    '''Return true if the store holds a largefile with the given hash.'''
    candidate = storepath(repo, hash, forcelocal)
    return os.path.exists(candidate)

199

200

def storepath(repo, hash, forcelocal=False):
    '''Return the location in the repository largefiles store for a file
    with the given hash.

    For a shared repo the path lies under repo.sharedpath, unless
    ``forcelocal`` is true.'''
    if forcelocal or not repo.shared():
        return repo.vfs.join(longname, hash)
    return repo.vfs.reljoin(repo.sharedpath, longname, hash)

206

207

def findstorepath(repo, hash):
    '''Look through the local store path(s) for the file with the given
    hash and return a ``(path, exists)`` tuple.

    When the file is not found, ``path`` is its location in the primary
    store and ``exists`` is False.
    '''
    # For shared repos, the primary store is in the share source. But for
    # backward compatibility, force a lookup in the local store if it wasn't
    # found in the share source.
    primary = storepath(repo, hash, False)

    if instore(repo, hash):
        return (primary, True)
    if repo.shared() and instore(repo, hash, True):
        return storepath(repo, hash, True), True

    return (primary, False)

223

224

def copyfromcache(repo, hash, filename):
    '''Copy the specified largefile from the repo or system cache to
    filename in the repository.

    Return true on success. Return false if the file was not found in
    either cache (which should not happen: this is meant to be called
    only after ensuring that the needed largefile exists in the cache),
    or if the copied data does not hash to ``hash``; in the latter case
    a warning is emitted and the written file is removed.'''
    wvfs = repo.wvfs
    source = findfile(repo, hash)
    if source is None:
        return False
    wvfs.makedirs(wvfs.dirname(wvfs.join(filename)))
    # The write may fail before the file is fully written, but we
    # don't use atomic writes in the working copy.
    with open(source, 'rb') as srcfd, wvfs(filename, 'wb') as destfd:
        chunks = util.filechunkiter(srcfd)
        gothash = copyandhash(chunks, destfd)
    if gothash == hash:
        return True
    repo.ui.warn(_('%s: data corruption in %s with hash %s\n')
                 % (filename, source, gothash))
    wvfs.unlink(filename)
    return False

247

248

def copytostore(repo, revorctx, file, uploaded=False):
    '''Copy the largefile ``file`` from the working directory into the
    store, unless the store already has its hash.

    The hash is read from the standin at ``revorctx``. A warning is
    emitted when the file is absent from the working directory.
    ``uploaded`` is accepted but not used here.'''
    wvfs = repo.wvfs
    hash = readstandin(repo, file, revorctx)
    if instore(repo, hash):
        return
    if not wvfs.exists(file):
        repo.ui.warn(_("%s: largefile %s not available from local store\n") %
                     (file, hash))
        return
    copytostoreabsolute(repo, wvfs.join(file), hash)

258

259

def copyalltostore(repo, node):
    '''Copy all largefiles in a given revision to the store'''

    ctx = repo[node]
    for filename in ctx.files():
        lfile = splitstandin(filename)
        # skip non-standins and standins absent from this revision's manifest
        if lfile is None or filename not in ctx.manifest():
            continue
        copytostore(repo, ctx, lfile)

267

268

def copytostoreabsolute(repo, file, hash):
    '''Put the largefile at the absolute path ``file`` into the store
    under ``hash``.

    If the user cache already has the hash, the store entry is linked
    from there. Otherwise the file is copied atomically into the store
    and then linked to the user cache.'''
    if inusercache(repo.ui, hash):
        link(usercachepath(repo.ui, hash), storepath(repo, hash))
        return

    util.makedirs(os.path.dirname(storepath(repo, hash)))
    with open(file, 'rb') as infile:
        with util.atomictempfile(storepath(repo, hash),
                                 createmode=repo.store.createmode) as outfile:
            for block in util.filechunkiter(infile):
                outfile.write(block)
    linktousercache(repo, hash)

279

280

def linktousercache(repo, hash):
    '''Link / copy the largefile with the specified hash from the store
    to the cache.'''
    cachepath = usercachepath(repo.ui, hash)
    link(storepath(repo, hash), cachepath)

285

286

def getstandinmatcher(repo, rmatcher=None):
    '''Return a match object that applies rmatcher to the standin directory'''
    wvfs = repo.wvfs
    standindir = shortname

    # no warnings about missing files or directories
    def badfn(f, msg):
        return None

    if not rmatcher or rmatcher.always():
        # no patterns: relative to repo root
        return scmutil.match(repo[None], [wvfs.join(standindir)],
                             badfn=badfn)

    pats = [wvfs.join(standindir, pat) for pat in rmatcher.files()]
    if not pats:
        pats = [wvfs.join(standindir)]
    match = scmutil.match(repo[None], pats, badfn=badfn)
    # if pats is empty, it would incorrectly always match, so clear _always
    match._always = False
    return match

305

306

def composestandinmatcher(repo, rmatcher):
    '''Return a matcher that accepts standins corresponding to the
    files accepted by rmatcher. Pass the list of files in the matcher
    as the paths specified by the user.'''
    smatcher = getstandinmatcher(repo, rmatcher)
    # capture the unwrapped match function before replacing it below
    standinmatchfn = smatcher.matchfn

    def composedmatchfn(f):
        return standinmatchfn(f) and rmatcher.matchfn(splitstandin(f))

    smatcher.matchfn = composedmatchfn
    return smatcher

317

318

def standin(filename):
    '''Return the repo-relative path to the standin for the specified big
    file.'''
    # Notes:
    # 1) Some callers want an absolute path, but for instance addlargefiles
    #    needs it repo-relative so it can be passed to repo[None].add().  So
    #    leave it up to the caller to use repo.wjoin() to get an absolute path.
    # 2) Join with '/' because that's what dirstate always uses, even on
    #    Windows. Change existing separator to '/' first in case we are
    #    passed filenames from an external source (like the command line).
    slashed = util.pconvert(filename)
    return shortnameslash + slashed

329

330

def isstandin(filename):
    '''Return true if filename is a big file standin, i.e. if it starts
    with the standin directory prefix. filename must be in Mercurial's
    internal form (slash-separated).'''
    prefix = shortnameslash
    return filename.startswith(prefix)

334

335

def splitstandin(filename):
    '''Return the largefile path that the standin ``filename`` stands
    for, or None if ``filename`` is not inside the standin directory.'''
    # Split on / because that's what dirstate always uses, even on Windows.
    # Change local separator to / first just in case we are passed filenames
    # from an external source (like the command line).
    head, sep, tail = util.pconvert(filename).partition('/')
    if sep and head == shortname:
        return tail
    return None

344

345

def updatestandin(repo, standin):
    '''Rewrite ``standin`` with the current hash and executable flag of
    the largefile it stands for.

    Raises error.Abort if the largefile is missing from the working
    directory.'''
    lfile = splitstandin(standin)
    abspath = repo.wjoin(lfile)
    if not repo.wvfs.exists(lfile):
        raise error.Abort(_('%s: file not found!') % lfile)
    newhash = hashfile(abspath)
    isexec = getexecutable(abspath)
    writestandin(repo, standin, newhash, isexec)

354

355

def readstandin(repo, filename, node=None):
    '''read hex hash from standin for filename at given node, or working
    directory if no node is given'''
    ctx = repo[node]
    fctx = ctx[standin(filename)]
    return fctx.data().strip()

359

360

def writestandin(repo, standin, hash, executable):
    '''write hash to <repo.root>/<standin>'''
    flags = 'x' if executable else ''
    repo.wwrite(standin, hash + '\n', flags)

363

364

def copyandhash(instream, outfile):
    '''Read bytes from instream (iterable) and write them to outfile,
    computing the SHA-1 hash of the data along the way. Return the hash
    as a hex string.'''
    # Start from an empty hasher rather than seeding it with '': the
    # empty seed adds nothing to the digest, and a str seed raises
    # TypeError on Python 3, where hashlib only accepts bytes.
    hasher = hashlib.sha1()
    for data in instream:
        hasher.update(data)
        outfile.write(data)
    return hasher.hexdigest()

372

373

def hashfile(file):
    '''Return the hex SHA-1 of the content of the file at path ``file``,
    or the empty string if no such path exists.'''
    if os.path.exists(file):
        with open(file, 'rb') as fd:
            return hexsha1(fd)
    return ''

381

378

382

def getexecutable(filename):
    '''Return a truthy value only if ``filename`` has the execute bit set
    for user, group and other alike.

    The value is the result of the bit tests, not a bool: 0 as soon as
    one of the user/group bits is missing, else ``mode & stat.S_IXOTH``.
    '''
    mode = os.stat(filename).st_mode
    for bit in (stat.S_IXUSR, stat.S_IXGRP):
        if not mode & bit:
            return mode & bit
    return mode & stat.S_IXOTH

387

384

388

def urljoin(first, second, *arg):
    '''Join URL pieces with exactly one added '/' between neighbours.

    A '/' is appended to the left side when it does not already end
    with one, and a single leading '/' is stripped from the right side.
    '''
    url = first
    for piece in (second,) + arg:
        base = url if url.endswith('/') else url + '/'
        tail = piece[1:] if piece.startswith('/') else piece
        url = base + tail
    return url

400

397

401

def hexsha1(fileobj):
    """hexsha1 returns the hex-encoded sha1 sum of the data in the file-like
    object fileobj"""
    digest = hashlib.sha1()
    # feed the hash in chunks, as produced by util.filechunkiter
    for block in util.filechunkiter(fileobj):
        digest.update(block)
    return digest.hexdigest()

408

405

409

def httpsendfile(ui, filename):
    '''Return an httpconnection.httpsendfile for ``filename``, opened
    with mode 'rb'.'''
    mode = 'rb'
    return httpconnection.httpsendfile(ui, filename, mode)

411

408

412

def unixpath(path):
    '''Return a version of path normalized for use with the lfdirstate.'''
    normalized = os.path.normpath(path)
    return util.pconvert(normalized)

415

412

416

def islfilesrepo(repo):
    '''Return true if the repo is a largefile repo.'''
    if 'largefiles' in repo.requirements:
        # look for a store data file whose name contains the standin prefix
        for entry in repo.store.datafiles():
            if shortnameslash in entry[0]:
                return True

    # otherwise: true if the largefiles dirstate has a truthy entry
    return any(openlfdirstate(repo.ui, repo, False))

423

420

424

class storeprotonotcapable(Exception):

421

class storeprotonotcapable(Exception):

425

def __init__(self, storetypes):

422

def __init__(self, storetypes):

426

self.storetypes = storetypes

423

self.storetypes = storetypes

427

424

428

def getstandinsstate(repo):
    '''Return a list of ``(lfile, hash)`` pairs, one per standin found by
    walking repo.dirstate.

    ``hash`` is None when reading the standin raises IOError.'''
    state = []
    standinmatcher = getstandinmatcher(repo)
    for standinpath in repo.dirstate.walk(standinmatcher, [], False, False):
        lfile = splitstandin(standinpath)
        try:
            lfhash = readstandin(repo, lfile)
        except IOError:
            lfhash = None
        state.append((lfile, lfhash))
    return state

439

436

440

def synclfdirstate(repo, lfdirstate, lfile, normallookup):
    '''Update the lfdirstate entry of ``lfile`` from the state that
    repo.dirstate records for its standin.

    A standin that repo.dirstate does not track is treated as state '?'
    and the largefile is dropped from lfdirstate.'''
    lfstandin = standin(lfile)
    if lfstandin in repo.dirstate:
        entry = repo.dirstate._map[lfstandin]
        state = entry[0]
        mtime = entry[3]
    else:
        state = '?'
        mtime = -1

    if state == 'n':
        # state 'n' doesn't ensure 'clean' in these cases
        needslookup = (normallookup or mtime < 0 or
                       not repo.wvfs.exists(lfile))
        if needslookup:
            lfdirstate.normallookup(lfile)
        else:
            lfdirstate.normal(lfile)
    elif state == 'm':
        lfdirstate.normallookup(lfile)
    elif state == 'r':
        lfdirstate.remove(lfile)
    elif state == 'a':
        lfdirstate.add(lfile)
    elif state == '?':
        lfdirstate.drop(lfile)

462

459

463

def markcommitted(orig, ctx, node):
    '''Call ``orig(node)``, then sync the lfdirstate and fill the store.

    After the wrapped ``orig`` callable has run, the largefile behind
    every standin listed in ``ctx.files()`` is synchronized into the
    lfdirstate, which is then written out.  Finally
    ``copyalltostore(repo, node)`` is invoked.
    '''
    repo = ctx.repo()

    orig(node)

    # ATTENTION: "ctx.files()" may differ from "repo[node].files()"
    # because files coming from the 2nd parent are omitted in the latter.
    #
    # The former should be used to get targets of "synclfdirstate",
    # because such files:
    # - are marked as "a" by "patch.patch()" (e.g. via transplant), and
    # - have to be marked as "n" after commit, but
    # - aren't listed in "repo[node].files()"

    lfdirstate = openlfdirstate(repo.ui, repo)
    for f in ctx.files():
        lfile = splitstandin(f)
        # splitstandin() gives None for names that are not standins.
        if lfile is not None:
            synclfdirstate(repo, lfdirstate, lfile, False)
    lfdirstate.write()

    # As part of committing, copy all of the largefiles into the cache.
    #
    # Using "node" instead of "ctx" implies additional "repo[node]"
    # lookup while copyalltostore(), but can omit redundant check for
    # files coming from the 2nd parent, which should exist in store
    # at merging.
    copyalltostore(repo, node)

491

488

492

def getlfilestoupdate(oldstandins, newstandins):
    '''Return the names whose entry differs between the two standin lists.

    Both arguments are iterables of hashable items whose first element is
    a file name (e.g. ``(lfile, hash)`` pairs).  An item present in only
    one of the two inputs marks its name as changed.  Each name is
    reported once; the order of the result is unspecified.
    '''
    changedstandins = set(oldstandins).symmetric_difference(set(newstandins))
    filelist = []
    # A name appears twice in changedstandins when only its hash changed;
    # track reported names in a set so the dedup check stays O(1).
    seen = set()
    for f in changedstandins:
        lfile = f[0]
        if lfile not in seen:
            seen.add(lfile)
            filelist.append(lfile)
    return filelist

499

496

500

def getlfilestoupload(repo, missing, addfunc):
    '''Call ``addfunc`` for the standins touched by the ``missing`` revs.

    For every revision ``n`` in ``missing``, the candidate files are
    ``ctx.files()``.  When the revision has two parents, the candidates
    also include files that are in either parent manifest but not in the
    revision's manifest, plus files whose manifest entry differs from
    either parent.  For each candidate that is a standin and exists in
    the revision, ``addfunc(fn, content)`` is called, where ``content`` is
    the stripped data of that standin.

    Progress is reported through ``repo.ui.progress``.
    '''
    topic = _('finding outgoing largefiles')
    total = len(missing)
    for i, n in enumerate(missing):
        repo.ui.progress(topic, i,
                         unit=_('revisions'), total=total)
        # NOTE(review): this compares the parent objects themselves with
        # node.nullid; confirm that it filters null parents as intended.
        parents = [p for p in repo[n].parents() if p != node.nullid]

        # Look the context up with repo.lfstatus switched off, restoring
        # the previous value even if the lookup fails.
        oldlfstatus = repo.lfstatus
        repo.lfstatus = False
        try:
            ctx = repo[n]
        finally:
            repo.lfstatus = oldlfstatus

        files = set(ctx.files())
        if len(parents) == 2:
            mc = ctx.manifest()
            ctxparents = ctx.parents()
            mp1 = ctxparents[0].manifest()
            mp2 = ctxparents[1].manifest()
            # Files present in a parent but absent from this revision.
            for f in mp1:
                if f not in mc:
                    files.add(f)
            for f in mp2:
                if f not in mc:
                    files.add(f)
            # Files whose entry differs from at least one parent.
            for f in mc:
                if mc[f] != mp1.get(f, None) or mc[f] != mp2.get(f, None):
                    files.add(f)
        for fn in files:
            if isstandin(fn) and fn in ctx:
                addfunc(fn, ctx[fn].data().strip())
    repo.ui.progress(topic, None)

531

528

532

def updatestandinsbymatch(repo, match):
    '''Update standins in the working directory according to specified match

    This returns (possibly modified) ``match`` object to be used for
    subsequent commit process.
    '''

    ui = repo.ui

    # Case 1: user calls commit with no specific files or
    # include/exclude patterns: refresh and commit all files that
    # are "dirty".
    if match is None or match.always():
        # Spend a bit of time here to get a list of files we know
        # are modified so we can compare only against those.
        # It can cost a lot of time (several seconds)
        # otherwise to update all standins if the largefiles are
        # large.
        lfdirstate = openlfdirstate(ui, repo)
        dirtymatch = matchmod.always(repo.root, repo.getcwd())
        unsure, s = lfdirstate.status(dirtymatch, [], False, False,
                                      False)
        # Only membership is tested below, so keep the names in a set.
        modifiedfiles = set(unsure + s.modified + s.added + s.removed)
        lfiles = listlfiles(repo)
        # this only loops through largefiles that exist (not
        # removed/renamed)
        for lfile in lfiles:
            if lfile in modifiedfiles:
                fstandin = standin(lfile)
                if repo.wvfs.exists(fstandin):
                    # this handles the case where a rebase is being
                    # performed and the working copy is not updated
                    # yet.
                    if repo.wvfs.exists(lfile):
                        updatestandin(repo, fstandin)

        return match

    lfiles = listlfiles(repo)
    match._files = repo._subdirlfs(match.files(), lfiles)

    # Case 2: user calls commit with specified patterns: refresh
    # any matching big files.
    smatcher = composestandinmatcher(repo, match)
    standins = repo.dirstate.walk(smatcher, [], False, False)

    # No matching big files: get out of the way and pass control to
    # the usual commit() method.
    if not standins:
        return match

    # Refresh all matching big files.  It's possible that the
    # commit will end up failing, in which case the big files will
    # stay refreshed.  No harm done: the user modified them and
    # asked to commit them, so sooner or later we're going to
    # refresh the standins.  Might as well leave them refreshed.
    lfdirstate = openlfdirstate(ui, repo)
    for fstandin in standins:
        lfile = splitstandin(fstandin)
        if lfdirstate[lfile] != 'r':
            updatestandin(repo, fstandin)

    # Cook up a new matcher that only matches regular files or
    # standins corresponding to the big files requested by the
    # user.  Have to modify _files to prevent commit() from
    # complaining "not tracked" for big files.
    match = copy.copy(match)
    origmatchfn = match.matchfn

    # Check both the list of largefiles and the list of
    # standins because if a largefile was removed, it
    # won't be in the list of largefiles at this point
    match._files += sorted(standins)

    actualfiles = []
    for f in match._files:
        fstandin = standin(f)

        # For largefiles, only one of the normal and standin should be
        # committed (except if one of them is a remove).  In the case of a
        # standin removal, drop the normal file if it is unknown to dirstate.
        # Thus, skip plain largefile names but keep the standin.
        if f in lfiles or fstandin in standins:
            if repo.dirstate[fstandin] != 'r':
                if repo.dirstate[f] != 'r':
                    continue
            elif repo.dirstate[f] == '?':
                continue

        actualfiles.append(f)
    match._files = actualfiles

    def matchfn(f):
        # Files accepted by the original matcher pass unless they are
        # largefiles; anything else passes only if it is a selected standin.
        if origmatchfn(f):
            return f not in lfiles
        else:
            return f in standins

    match.matchfn = matchfn

    return match

633

630

634

class automatedcommithook(object):
    '''Stateful hook to update standins at the 1st commit of resuming

    For efficiency, updating standins in the working directory should
    be avoided while automated committing (like rebase, transplant and
    so on), because they should be updated before committing.

    But the 1st commit of resuming automated committing (e.g. ``rebase
    --continue``) should update them, because largefiles may be
    modified manually.
    '''
    def __init__(self, resuming):
        # True until the first call; see __call__.
        self.resuming = resuming

    def __call__(self, repo, match):
        '''Return the matcher to use for the commit.

        On the first call of a resuming hook the standins are refreshed
        via ``updatestandinsbymatch()`` and its result is returned; every
        other call returns ``match`` unchanged.
        '''
        if self.resuming:
            self.resuming = False # avoids updating at subsequent commits
            return updatestandinsbymatch(repo, match)
        else:
            return match

654

651

655

def getstatuswriter(ui, repo, forcibly=None):
    '''Return the function to write largefiles specific status out

    If ``forcibly`` is ``None`` and ``repo`` has the ``_largefilesenabled``
    attribute, this returns the last element of ``repo._lfstatuswriters``
    as "default" writer function.

    Otherwise, this returns the function to always write out (or
    ignore if ``not forcibly``) status.  This also means status is
    ignored when ``forcibly`` is ``None`` but ``repo`` lacks
    ``_largefilesenabled``.
    '''
    if forcibly is None and util.safehasattr(repo, '_largefilesenabled'):
        return repo._lfstatuswriters[-1]
    if forcibly:
        return ui.status # forcibly WRITE OUT
    return lambda *msg, **opts: None # forcibly IGNORE

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # Copyright 2009-2010 Gregory P. Ward
             # Copyright 2009-2010 Intelerad Medical Systems Incorporated
             # Copyright 2010-2011 Fog Creek Software
             # Copyright 2010-2011 Unity Technologies
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             '''largefiles utility code: must not import other modules in this package.'''
             from __future__ import absolute_import
             import copy
             import hashlib
             import os
             import platform
             import stat
             from mercurial.i18n import _
             from mercurial import (
                 dirstate,
                 encoding,
                 error,
                 httpconnection,
                 match as matchmod,
                 node,
                 pycompat,
                 scmutil,
                 util,
                 vfs as vfsmod,
             )
             shortname = '.hglf'
             shortnameslash = shortname + '/'
             longname = 'largefiles'
             # -- Private worker functions ------------------------------------------
             def getminsize(ui, assumelfiles, opt, default=10):
                 '''Return the minimum largefile size to use.
                 ``opt`` wins when it is set.  Otherwise, if ``assumelfiles`` is
                 true, the ``largefiles.minsize`` config value is consulted (with
                 ``default`` as its fallback).  A truthy result is converted to a
                 float; a falsy result other than ``None`` is returned unchanged.
                 Aborts when no size is available (``None``) or when the value
                 cannot be parsed as a number.'''
                 size = opt
                 if assumelfiles and not size:
                     size = ui.config(longname, 'minsize', default=default)
                 if size is None:
                     raise error.Abort(_('minimum size for largefiles must be specified'))
                 if not size:
                     # falsy but not None (e.g. 0): hand it back untouched
                     return size
                 try:
                     return float(size)
                 except ValueError:
                     raise error.Abort(_('largefiles: size must be number (not %s)\n')
                                       % size)
             def link(src, dest):
                 """Make ``dest`` a hardlink to ``src``, copying when linking fails.
                 The parent directory of ``dest`` is created first.  If the hardlink
                 attempt raises OSError, the content is streamed chunk by chunk into
                 an atomic temp file for ``dest`` and the mode bits of ``src`` are
                 applied to the result."""
                 util.makedirs(os.path.dirname(dest))
                 try:
                     util.oslink(src, dest)
                 except OSError:
                     # hardlink unavailable: fall back to an atomic copy
                     with open(src, 'rb') as infile, \
                             util.atomictempfile(dest) as outfile:
                         for block in util.filechunkiter(infile):
                             outfile.write(block)
                     srcmode = os.stat(src).st_mode
                     os.chmod(dest, srcmode)
             def usercachepath(ui, hash):
                 '''Return the path inside the "global" largefiles cache where the
                 file with the given hash lives.
                 The cache is shared across repositories, saving both download
                 bandwidth and storage space.'''
                 cachedir = _usercachedir(ui)
                 return os.path.join(cachedir, hash)
             def _usercachedir(ui):
                 '''Return the directory of the "global" largefiles cache.
                 An explicit ``largefiles.usercache`` config path takes priority.
                 Otherwise the location is derived from environment variables that
                 depend on the platform.  Aborts on an unrecognized OS name or when
                 none of the expected variables is set.'''
                 configured = ui.configpath(longname, 'usercache', None)
                 if configured:
                     return configured
                 env = encoding.environ
                 if pycompat.osname == 'nt':
                     # prefer LOCALAPPDATA, fall back to APPDATA
                     appdata = env.get('LOCALAPPDATA', env.get('APPDATA'))
                     if appdata:
                         return os.path.join(appdata, longname)
                 elif platform.system() == 'Darwin':
                     homedir = env.get('HOME')
                     if homedir:
                         return os.path.join(homedir, 'Library', 'Caches', longname)
                 elif pycompat.osname == 'posix':
                     xdgcache = env.get('XDG_CACHE_HOME')
                     if xdgcache:
                         return os.path.join(xdgcache, longname)
                     homedir = env.get('HOME')
                     if homedir:
                         return os.path.join(homedir, '.cache', longname)
                 else:
                     raise error.Abort(_('unknown operating system: %s\n')
                                       % pycompat.osname)
                 # known platform, but nothing in the environment to go by
                 raise error.Abort(_('unknown %s usercache location') % longname)
             def inusercache(ui, hash):
                 '''Return true if a file for ``hash`` exists in the user cache.'''
                 return os.path.exists(usercachepath(ui, hash))
             def findfile(repo, hash):
                 '''Return the store path of the largefile with the given hash, or
                 None when it is not available locally.
                 If the file is missing from the store but present in the user
                 cache, it is linked into the store as a side effect.'''
                 ui = repo.ui
                 storedpath, found = findstorepath(repo, hash)
                 if found:
                     ui.note(_('found %s in store\n') % hash)
                     return storedpath
                 if not inusercache(ui, hash):
                     return None
                 ui.note(_('found %s in system cache\n') % hash)
                 storedpath = storepath(repo, hash)
                 link(usercachepath(ui, hash), storedpath)
                 return storedpath
             class largefilesdirstate(dirstate.dirstate):
                 '''dirstate subclass used to track largefiles.
                 The per-file methods below pass the file name through unixpath()
                 before delegating to the base class.'''
                 def __getitem__(self, key):
                     return super(largefilesdirstate, self).__getitem__(unixpath(key))
                 def normal(self, f):
                     return super(largefilesdirstate, self).normal(unixpath(f))
                 def remove(self, f):
                     return super(largefilesdirstate, self).remove(unixpath(f))
                 def add(self, f):
                     return super(largefilesdirstate, self).add(unixpath(f))
                 def drop(self, f):
                     return super(largefilesdirstate, self).drop(unixpath(f))
                 def forget(self, f):
                     return super(largefilesdirstate, self).forget(unixpath(f))
                 def normallookup(self, f):
                     return super(largefilesdirstate, self).normallookup(unixpath(f))
                 def _ignore(self, f):
                     # nothing is ever treated as ignored by this dirstate
                     return False
                 def write(self, tr=False):
                     # The ``tr`` argument is deliberately not forwarded; None is
                     # always passed to the base class instead, in order to:
                     # (1) disable PENDING mode always
                     #     (lfdirstate isn't yet managed as a part of the transaction)
                     # (2) avoid develwarn 'use dirstate.write with ....'
                     super(largefilesdirstate, self).write(None)
             def openlfdirstate(ui, repo, create=True):
                 '''
                 Return a dirstate object that tracks largefiles: its root is the
                 repo root, but it is stored under the ``largefiles`` directory of
                 ``repo.vfs``.
                 When ``create`` is true and no such dirstate file exists yet, the
                 returned object is populated from the standins known to the
                 regular dirstate.
                 '''
                 vfs = repo.vfs
                 storedir = longname
                 lfopener = vfsmod.vfs(vfs.join(storedir))
                 lfdirstate = largefilesdirstate(lfopener, ui, repo.root,
                                                  repo.dirstate._validate)
                 if not create or vfs.exists(vfs.join(storedir, 'dirstate')):
                     return lfdirstate
                 # The largefiles dirstate does not exist: populate and create
                 # it. This ensures that we create it on the first meaningful
                 # largefiles operation in a new clone.
                 found = repo.dirstate.walk(getstandinmatcher(repo), [], False, False)
                 if len(found) > 0:
                     vfs.makedirs(storedir)
                 for fstandin in found:
                     lfdirstate.normallookup(splitstandin(fstandin))
                 return lfdirstate
             def lfdirstatestatus(lfdirstate, repo):
                 '''Return the status of ``lfdirstate`` with every "unsure" file
                 resolved.
                 Each unsure largefile is compared against the hash recorded in its
                 standin in the ``.`` revision: a match moves it to ``clean`` (and
                 marks it normal in ``lfdirstate``), anything else to ``modified``.'''
                 parentctx = repo['.']
                 everything = matchmod.always(repo.root, repo.getcwd())
                 unsure, status = lfdirstate.status(everything, [], False, False, False)
                 modified = status.modified
                 clean = status.clean
                 for lfile in unsure:
                     try:
                         standinctx = parentctx[standin(lfile)]
                     except LookupError:
                         # no standin in the parent revision
                         standinctx = None
                     if standinctx and (standinctx.data().strip()
                                        == hashfile(repo.wjoin(lfile))):
                         clean.append(lfile)
                         lfdirstate.normal(lfile)
                     else:
                         modified.append(lfile)
                 return status
             def listlfiles(repo, rev=None, matcher=None):
                 '''Return the largefiles of the working copy (``rev`` is None) or
                 of the given changeset, as names with the standin prefix removed.
                 Defaults to a matcher covering the whole standin directory.'''
                 if matcher is None:
                     matcher = getstandinmatcher(repo)
                 lfiles = []
                 for fstandin in repo[rev].walk(matcher):
                     # ignore unknown files in working directory
                     if rev is None and repo.dirstate[fstandin] == '?':
                         continue
                     lfiles.append(splitstandin(fstandin))
                 return lfiles
             def instore(repo, hash, forcelocal=False):
                 '''Return true if the store path computed for ``hash`` exists.'''
                 candidate = storepath(repo, hash, forcelocal)
                 return os.path.exists(candidate)
             def storepath(repo, hash, forcelocal=False):
                 '''Return the location in the repository largefiles store for the
                 file with the given hash.
                 For a shared repo the path is built from ``repo.sharedpath``,
                 unless ``forcelocal`` requests the local store.'''
                 if forcelocal or not repo.shared():
                     return repo.vfs.join(longname, hash)
                 return repo.vfs.reljoin(repo.sharedpath, longname, hash)
             def findstorepath(repo, hash):
                 '''Look for the file with the given hash in the local store path(s).
                 Returns a ``(path, exists)`` tuple.  When the file is not found
                 anywhere, ``path`` is its location in the primary store.
                 '''
                 # For shared repos, the primary store is in the share source.  But for
                 # backward compatibility, force a lookup in the local store if it wasn't
                 # found in the share source.
                 primary = storepath(repo, hash, False)
                 if instore(repo, hash):
                     return (primary, True)
                 if repo.shared() and instore(repo, hash, True):
                     return (storepath(repo, hash, True), True)
                 return (primary, False)
             def copyfromcache(repo, hash, filename):
                 '''Copy the largefile with the given hash from the repo store or the
                 system cache to ``filename`` in the working directory.
                 Return True on success.  Return False if the file was found in
                 neither place (which should not happen: callers are expected to
                 ensure beforehand that the largefile is cached), or if the copied
                 data does not hash to ``hash``; in the latter case a warning is
                 issued and the partial copy is removed.'''
                 wvfs = repo.wvfs
                 cached = findfile(repo, hash)
                 if cached is None:
                     return False
                 wvfs.makedirs(wvfs.dirname(wvfs.join(filename)))
                 # The write may fail before the file is fully written, but we
                 # don't use atomic writes in the working copy.
                 with open(cached, 'rb') as srcfd, wvfs(filename, 'wb') as destfd:
                     actual = copyandhash(util.filechunkiter(srcfd), destfd)
                 if actual == hash:
                     return True
                 repo.ui.warn(_('%s: data corruption in %s with hash %s\n')
                              % (filename, cached, actual))
                 wvfs.unlink(filename)
                 return False
             def copytostore(repo, revorctx, file, uploaded=False):
                 '''Copy largefile ``file`` from the working directory into the
                 store, keyed by the hash read from its standin at ``revorctx``.
                 Does nothing when the store already has that hash; warns when the
                 file is absent from the working directory.  ``uploaded`` is
                 accepted but not used here.'''
                 lfhash = readstandin(repo, file, revorctx)
                 if instore(repo, lfhash):
                     return
                 wvfs = repo.wvfs
                 if not wvfs.exists(file):
                     repo.ui.warn(_("%s: largefile %s not available from local store\n") %
                                  (file, lfhash))
                     return
                 copytostoreabsolute(repo, wvfs.join(file), lfhash)
             def copyalltostore(repo, node):
                 '''Copy every largefile touched by the given revision to the store.
                 Only files of the revision that are standins and are still present
                 in its manifest are considered.'''
                 ctx = repo[node]
                 for fname in ctx.files():
                     lfile = splitstandin(fname)
                     if lfile is None:
                         # not a standin
                         continue
                     if fname in ctx.manifest():
                         copytostore(repo, ctx, lfile)
             def copytostoreabsolute(repo, file, hash):
                 '''Put the content of ``file`` into the store under ``hash``.
                 When the user cache already holds that hash, the store entry is
                 linked from the cache.  Otherwise ``file`` is copied atomically
                 into the store and then linked into the user cache.'''
                 if inusercache(repo.ui, hash):
                     link(usercachepath(repo.ui, hash), storepath(repo, hash))
                     return
                 target = storepath(repo, hash)
                 util.makedirs(os.path.dirname(target))
                 with open(file, 'rb') as infile, \
                         util.atomictempfile(
                             target, createmode=repo.store.createmode) as outfile:
                     for block in util.filechunkiter(infile):
                         outfile.write(block)
                 linktousercache(repo, hash)
             def linktousercache(repo, hash):
                 '''Link (or copy) the largefile with the given hash from the store
                 into the user cache.'''
                 cachepath = usercachepath(repo.ui, hash)
                 link(storepath(repo, hash), cachepath)
             def getstandinmatcher(repo, rmatcher=None):
                 '''Return a match object that applies rmatcher to the standin
                 directory.
                 Without ``rmatcher`` (or with one that matches everything) the
                 result simply covers the whole standin directory.'''
                 wvfs = repo.wvfs
                 standindir = shortname
                 def badfn(f, msg):
                     # no warnings about missing files or directories
                     return None
                 if not rmatcher or rmatcher.always():
                     # no patterns: relative to repo root
                     return scmutil.match(repo[None], [wvfs.join(standindir)],
                                          badfn=badfn)
                 pats = ([wvfs.join(standindir, pat) for pat in rmatcher.files()]
                         or [wvfs.join(standindir)])
                 match = scmutil.match(repo[None], pats, badfn=badfn)
                 # if pats is empty, it would incorrectly always match, so clear _always
                 match._always = False
                 return match
             def composestandinmatcher(repo, rmatcher):
                 '''Return a matcher accepting the standins that correspond to the
                 files accepted by rmatcher.  The files listed in rmatcher are
                 passed on as the paths specified by the user.'''
                 smatcher = getstandinmatcher(repo, rmatcher)
                 standinmatchfn = smatcher.matchfn
                 def bothmatch(f):
                     # must be a matching standin AND its largefile must be wanted
                     if not standinmatchfn(f):
                         return standinmatchfn(f)
                     return rmatcher.matchfn(splitstandin(f))
                 smatcher.matchfn = bothmatch
                 return smatcher
             def standin(filename):
                 '''Return the repo-relative standin path for the given big file.'''
                 # Notes:
                 # 1) The result is repo-relative on purpose: addlargefiles, for
                 #    instance, passes it to repo[None].add().  Callers that want
                 #    an absolute path use repo.wjoin() themselves.
                 # 2) The join uses '/' because that's what dirstate always uses,
                 #    even on Windows.  Existing separators are converted to '/'
                 #    first in case the name came from an external source (like
                 #    the command line).
                 normalized = util.pconvert(filename)
                 return shortnameslash + normalized
             def isstandin(filename):
                 '''Return true if filename names a big file standin.
                 filename must be in Mercurial's internal (slash-separated) form.'''
                 prefix = shortnameslash
                 return filename.startswith(prefix)
             def splitstandin(filename):
                 '''Return the largefile name for a standin path, or None when
                 ``filename`` does not lie directly under the standin directory.'''
                 # Cut at the first '/' because that's what dirstate always uses,
                 # even on Windows.  The local separator is converted to '/' first
                 # just in case the name came from an external source (like the
                 # command line).
                 head, sep, rest = util.pconvert(filename).partition('/')
                 if sep and head == shortname:
                     return rest
                 return None
             def updatestandin(repo, standin):
                 '''Rewrite ``standin`` from the current state of its largefile in
                 the working directory (content hash and executable bit).
                 Aborts if the largefile does not exist.'''
                 lfile = splitstandin(standin)
                 abspath = repo.wjoin(lfile)
                 if not repo.wvfs.exists(lfile):
                     raise error.Abort(_('%s: file not found!') % lfile)
                 newhash = hashfile(abspath)
                 isexec = getexecutable(abspath)
                 writestandin(repo, standin, newhash, isexec)
             def readstandin(repo, filename, node=None):
                 '''Return the stripped content of the standin for filename at the
                 given node (the hex hash), or from the working directory when no
                 node is given.'''
                 ctx = repo[node]
                 standinctx = ctx[standin(filename)]
                 return standinctx.data().strip()
             def writestandin(repo, standin, hash, executable):
                 '''Write ``hash`` plus a newline to <repo.root>/<standin>, with the
                 'x' flag when ``executable`` is true.'''
                 flags = 'x' if executable else ''
                 repo.wwrite(standin, hash + '\n', flags)
             def copyandhash(instream, outfile):
                 '''Read bytes from instream (iterable) and write them to outfile,
                 computing the SHA-1 hash of the data along the way.
                 Returns the hex digest of everything that was copied (the digest
                 of empty input when ``instream`` yields nothing).'''
                 # Start from an empty hasher rather than seeding with a '' text
                 # literal: hashlib rejects text strings on Python 3, and the
                 # no-argument form is what hexsha1() in this module uses too.
                 hasher = hashlib.sha1()
                 for data in instream:
                     hasher.update(data)
                     outfile.write(data)
                 return hasher.hexdigest()
             def hashfile(file):
                 if not os.path.exists(file):
                     return ''
-                hasher = hashlib.sha1('')
                 with open(file, 'rb') as fd:
-                    for data in util.filechunkiter(fd):
+                    return hexsha1(fd)
-                        hasher.update(data)
-                return hasher.hexdigest()
             def getexecutable(filename):
                 '''Return a true value only if ``filename`` has the execute bit
                 set for user, group and others alike.'''
                 mode = os.stat(filename).st_mode
                 for bit in (stat.S_IXUSR, stat.S_IXGRP):
                     masked = mode & bit
                     if not masked:
                         # first missing bit decides the (falsy) result
                         return masked
                 return mode & stat.S_IXOTH
             def urljoin(first, second, *arg):
                 '''Join two or more URL pieces with exactly one '/' inserted at
                 each seam.
                 At every join, a '/' is appended to the left part unless it
                 already ends with one, and a single leading '/' is dropped from
                 the right part.'''
                 def glue(left, right):
                     head = left if left.endswith('/') else left + '/'
                     tail = right[1:] if right.startswith('/') else right
                     return head + tail
                 url = first
                 for piece in (second,) + arg:
                     url = glue(url, piece)
                 return url
-            def hexsha1(data):
+            def hexsha1(fileobj):
                 """hexsha1 returns the hex-encoded sha1 sum of the data in the file-like
                 object data"""
                 h = hashlib.sha1()
-                for chunk in util.filechunkiter(data):
+                for chunk in util.filechunkiter(fileobj):
                     h.update(chunk)
                 return h.hexdigest()
             def httpsendfile(ui, filename):
                 '''Return an ``httpconnection.httpsendfile`` for ``filename``
                 opened in 'rb' mode.'''
                 mode = 'rb'
                 return httpconnection.httpsendfile(ui, filename, mode)
             def unixpath(path):
                 '''Return path in the normalized form used with the lfdirstate:
                 run through os.path.normpath, then util.pconvert.'''
                 normalized = os.path.normpath(path)
                 return util.pconvert(normalized)
             def islfilesrepo(repo):
                 '''Return true if the repo is a largefile repo.
                 That is the case when the repo has the 'largefiles' requirement
                 and a store data file whose name contains the standin prefix, or
                 when the largefiles dirstate (opened without creating it) has any
                 entry.'''
                 if 'largefiles' in repo.requirements:
                     for entry in repo.store.datafiles():
                         if shortnameslash in entry[0]:
                             return True
                 return any(openlfdirstate(repo.ui, repo, False))
             class storeprotonotcapable(Exception):
                 '''Exception carrying a ``storetypes`` value.
                 NOTE(review): presumably raised when no store supports the
                 remote's protocol; the raising code is not visible here.'''
                 def __init__(self, storetypes):
                     # kept on the instance for whoever catches the exception;
                     # Exception.__init__ is not invoked, so ``args`` stays empty
                     self.storetypes = storetypes
             def getstandinsstate(repo):
                 '''Return a list of ``(largefile, hash)`` pairs for the standins
                 found by walking the dirstate.
                 ``hash`` is None when reading the standin raises IOError.'''
                 matcher = getstandinmatcher(repo)
                 state = []
                 for fstandin in repo.dirstate.walk(matcher, [], False, False):
                     lfile = splitstandin(fstandin)
                     try:
                         lfhash = readstandin(repo, lfile)
                     except IOError:
                         lfhash = None
                     state.append((lfile, lfhash))
                 return state
             def synclfdirstate(repo, lfdirstate, lfile, normallookup):
                 '''Bring the ``lfdirstate`` entry of ``lfile`` in line with the
                 state of its standin in ``repo.dirstate``.
                 A standin unknown to the dirstate is handled as state '?'.  With
                 ``normallookup`` true, a standin in state 'n' is recorded via
                 normallookup() rather than normal().'''
                 lfstandin = standin(lfile)
                 if lfstandin not in repo.dirstate:
                     state, mtime = '?', -1
                 else:
                     entry = repo.dirstate._map[lfstandin]
                     state = entry[0]
                     mtime = entry[3]
                 if state == 'n':
                     # state 'n' doesn't ensure 'clean' in these cases
                     uncertain = (normallookup or mtime < 0 or
                                  not repo.wvfs.exists(lfile))
                     if uncertain:
                         lfdirstate.normallookup(lfile)
                     else:
                         lfdirstate.normal(lfile)
                 elif state == 'm':
                     lfdirstate.normallookup(lfile)
                 elif state == 'r':
                     lfdirstate.remove(lfile)
                 elif state == 'a':
                     lfdirstate.add(lfile)
                 elif state == '?':
                     lfdirstate.drop(lfile)
             def markcommitted(orig, ctx, node):
                 '''Call ``orig(node)``, then sync the largefiles dirstate for every
                 standin in ``ctx.files()`` and copy the largefiles of ``node`` into
                 the store.'''
                 repo = ctx.repo()
                 orig(node)
                 # ATTENTION: "ctx.files()" may differ from "repo[node].files()"
                 # because files coming from the 2nd parent are omitted in the latter.
                 #
                 # The former should be used to get targets of "synclfdirstate",
                 # because such files:
                 # - are marked as "a" by "patch.patch()" (e.g. via transplant), and
                 # - have to be marked as "n" after commit, but
                 # - aren't listed in "repo[node].files()"
                 lfdirstate = openlfdirstate(repo.ui, repo)
                 for fname in ctx.files():
                     lfile = splitstandin(fname)
                     if lfile is None:
                         continue
                     synclfdirstate(repo, lfdirstate, lfile, False)
                 lfdirstate.write()
                 # As part of committing, copy all of the largefiles into the cache.
                 #
                 # Using "node" instead of "ctx" implies an additional "repo[node]"
                 # lookup in copyalltostore(), but lets us omit a redundant check
                 # for files coming from the 2nd parent, which should exist in the
                 # store at merging.
                 copyalltostore(repo, node)
             def getlfilestoupdate(oldstandins, newstandins):
                 '''Return the names of the largefiles whose standin entry differs
                 between ``oldstandins`` and ``newstandins``.
                 Both arguments are iterables of hashable tuples whose first item
                 is the largefile name.  Each name is listed once, even when both
                 its old and its new entry are in the difference.'''
                 changedstandins = set(oldstandins).symmetric_difference(set(newstandins))
                 # track emitted names in a set: membership tests on the result
                 # list would make this quadratic in the number of changes
                 seen = set()
                 filelist = []
                 for entry in changedstandins:
                     lfile = entry[0]
                     if lfile not in seen:
                         seen.add(lfile)
                         filelist.append(lfile)
                 return filelist
             def getlfilestoupload(repo, missing, addfunc):
                 '''Report the standins referenced by the ``missing`` revisions.
                 For every revision in ``missing``, ``addfunc(standin, hash)`` is
                 called for each affected standin that exists in that revision,
                 where ``hash`` is the stripped standin content.  Progress is
                 reported through ``repo.ui.progress``.'''
                 for i, n in enumerate(missing):
                     repo.ui.progress(_('finding outgoing largefiles'), i,
                         unit=_('revisions'), total=len(missing))
                     # keep only parents that do not compare equal to nullid
                     parents = [p for p in repo[n].parents() if p != node.nullid]
                     # look the changeset up with repo.lfstatus switched off,
                     # restoring the previous value whatever happens
                     oldlfstatus = repo.lfstatus
                     repo.lfstatus = False
                     try:
                         ctx = repo[n]
                     finally:
                         repo.lfstatus = oldlfstatus
                     files = set(ctx.files())
                     if len(parents) == 2:
                         # merge: ctx.files() alone is not trusted here, so add
                         # every file that is gone from either parent or whose
                         # manifest entry differs from either parent's
                         mc = ctx.manifest()
                         mp1 = ctx.parents()[0].manifest()
                         mp2 = ctx.parents()[1].manifest()
                         for f in mp1:
                             if f not in mc:
                                 files.add(f)
                         for f in mp2:
                             if f not in mc:
                                 files.add(f)
                         for f in mc:
                             if mc[f] != mp1.get(f, None) or mc[f] != mp2.get(f, None):
                                 files.add(f)
                     for fn in files:
                         # only standins still present in this revision count
                         if isstandin(fn) and fn in ctx:
                             addfunc(fn, ctx[fn].data().strip())
                 # passing None as the position ends the progress report
                 repo.ui.progress(_('finding outgoing largefiles'), None)
             def updatestandinsbymatch(repo, match):
                 '''Update standins in the working directory according to specified match
                 This returns (possibly modified) ``match`` object to be used for
                 subsequent commit process.
                 When ``match`` is None or matches everything, the standins of all
                 dirty largefiles are refreshed and ``match`` is returned as is.
                 Otherwise the standins selected by ``match`` are refreshed and,
                 unless none matched, a copy of ``match`` with adjusted ``_files``
                 and ``matchfn`` is returned.  Note that ``match._files`` of the
                 passed-in object is reassigned in the second case.
                 '''
                 ui = repo.ui
                 # Case 1: user calls commit with no specific files or
                 # include/exclude patterns: refresh and commit all files that
                 # are "dirty".
                 if match is None or match.always():
                     # Spend a bit of time here to get a list of files we know
                     # are modified so we can compare only against those.
                     # It can cost a lot of time (several seconds)
                     # otherwise to update all standins if the largefiles are
                     # large.
                     lfdirstate = openlfdirstate(ui, repo)
                     dirtymatch = matchmod.always(repo.root, repo.getcwd())
                     unsure, s = lfdirstate.status(dirtymatch, [], False, False,
                                                   False)
                     modifiedfiles = unsure + s.modified + s.added + s.removed
                     lfiles = listlfiles(repo)
                     # this only loops through largefiles that exist (not
                     # removed/renamed)
                     for lfile in lfiles:
                         if lfile in modifiedfiles:
                             fstandin = standin(lfile)
                             if repo.wvfs.exists(fstandin):
                                 # this handles the case where a rebase is being
                                 # performed and the working copy is not updated
                                 # yet.
                                 if repo.wvfs.exists(lfile):
                                     updatestandin(repo, fstandin)
                     return match
                 lfiles = listlfiles(repo)
                 # NOTE(review): repo._subdirlfs is defined outside this chunk;
                 # its exact effect on the file list should be confirmed there.
                 match._files = repo._subdirlfs(match.files(), lfiles)
                 # Case 2: user calls commit with specified patterns: refresh
                 # any matching big files.
                 smatcher = composestandinmatcher(repo, match)
                 standins = repo.dirstate.walk(smatcher, [], False, False)
                 # No matching big files: get out of the way and pass control to
                 # the usual commit() method.
                 if not standins:
                     return match
                 # Refresh all matching big files.  It's possible that the
                 # commit will end up failing, in which case the big files will
                 # stay refreshed.  No harm done: the user modified them and
                 # asked to commit them, so sooner or later we're going to
                 # refresh the standins.  Might as well leave them refreshed.
                 lfdirstate = openlfdirstate(ui, repo)
                 for fstandin in standins:
                     lfile = splitstandin(fstandin)
                     # largefiles marked as removed have nothing to hash
                     if lfdirstate[lfile] != 'r':
                         updatestandin(repo, fstandin)
                 # Cook up a new matcher that only matches regular files or
                 # standins corresponding to the big files requested by the
                 # user.  Have to modify _files to prevent commit() from
                 # complaining "not tracked" for big files.
                 match = copy.copy(match)
                 origmatchfn = match.matchfn
                 # Check both the list of largefiles and the list of
                 # standins because if a largefile was removed, it
                 # won't be in the list of largefiles at this point
                 match._files += sorted(standins)
                 actualfiles = []
                 for f in match._files:
                     fstandin = standin(f)
                     # For largefiles, only one of the normal and standin should be
                     # committed (except if one of them is a remove).  In the case of a
                     # standin removal, drop the normal file if it is unknown to dirstate.
                     # Thus, skip plain largefile names but keep the standin.
                     if f in lfiles or fstandin in standins:
                         if repo.dirstate[fstandin] != 'r':
                             if repo.dirstate[f] != 'r':
                                 continue
                         elif repo.dirstate[f] == '?':
                             continue
                     actualfiles.append(f)
                 match._files = actualfiles
                 def matchfn(f):
                     # files accepted by the original matcher pass unless they are
                     # largefiles; everything else passes only if it is one of
                     # the standins collected above
                     if origmatchfn(f):
                         return f not in lfiles
                     else:
                         return f in standins
                 match.matchfn = matchfn
                 return match
             class automatedcommithook(object):
                 '''Stateful hook that updates standins only at the 1st commit
                 after resuming.
                 While committing automatically (rebase, transplant and so on),
                 standins in the working directory are expected to be up to date
                 already, so refreshing them again is avoided for efficiency.
                 The 1st commit of a resumed operation (e.g. ``rebase
                 --continue``) is the exception: largefiles may have been
                 modified manually in the meantime, so standins are updated
                 then.
                 '''
                 def __init__(self, resuming):
                     self.resuming = resuming
                 def __call__(self, repo, match):
                     if not self.resuming:
                         return match
                     # one-shot: subsequent commits must not update again
                     self.resuming = False
                     return updatestandinsbymatch(repo, match)
             def getstatuswriter(ui, repo, forcibly=None):
                 '''Return the function used to write largefiles specific status.
                 With ``forcibly`` left as ``None`` and a repo that has the
                 ``_largefilesenabled`` attribute, the last element of
                 ``repo._lfstatuswriters`` is returned as the "default" writer.
                 Otherwise the result is ``ui.status`` when ``forcibly`` is true,
                 and a function that discards its arguments when it is not.
                 '''
                 usedefault = (forcibly is None and
                               util.safehasattr(repo, '_largefilesenabled'))
                 if usedefault:
                     return repo._lfstatuswriters[-1]
                 if forcibly:
                     # forcibly WRITE OUT
                     return ui.status
                 # forcibly IGNORE
                 return lambda *msg, **opts: None