largefiles: introduce readasstandin() to read hex hash from given filectx...
FUJIWARA Katsunori
r31734:44ff5e4f default
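In short, the new readasstandin() helper encapsulates how a standin's hex hash is read from a filectx, and readstandin() becomes a thin wrapper around it. A minimal usage sketch follows; the repository path and the largefile name 'data.bin' are hypothetical and not part of this change:

from mercurial import hg, ui as uimod
from hgext.largefiles import lfutil

# assumes the current directory is a repository with largefiles enabled
repo = hg.repository(uimod.ui.load(), '.')
# filectx of the standin .hglf/data.bin at the working directory's parent
fctx = repo['.'][lfutil.standin('data.bin')]
print(lfutil.readasstandin(fctx))                 # hex hash stored in the standin
print(lfutil.readstandin(repo, 'data.bin', '.'))  # same hash via the wrapper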
@@ -1,670 +1,676 @@
# Copyright 2009-2010 Gregory P. Ward
# Copyright 2009-2010 Intelerad Medical Systems Incorporated
# Copyright 2010-2011 Fog Creek Software
# Copyright 2010-2011 Unity Technologies
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

'''largefiles utility code: must not import other modules in this package.'''
from __future__ import absolute_import

import copy
import hashlib
import os
import platform
import stat

from mercurial.i18n import _

from mercurial import (
    dirstate,
    encoding,
    error,
    httpconnection,
    match as matchmod,
    node,
    pycompat,
    scmutil,
    util,
    vfs as vfsmod,
)

shortname = '.hglf'
shortnameslash = shortname + '/'
longname = 'largefiles'

# -- Private worker functions ------------------------------------------

def getminsize(ui, assumelfiles, opt, default=10):
    lfsize = opt
    if not lfsize and assumelfiles:
        lfsize = ui.config(longname, 'minsize', default=default)
    if lfsize:
        try:
            lfsize = float(lfsize)
        except ValueError:
            raise error.Abort(_('largefiles: size must be number (not %s)\n')
                              % lfsize)
    if lfsize is None:
        raise error.Abort(_('minimum size for largefiles must be specified'))
    return lfsize

def link(src, dest):
    """Try to create hardlink - if that fails, efficiently make a copy."""
    util.makedirs(os.path.dirname(dest))
    try:
        util.oslink(src, dest)
    except OSError:
        # if hardlinks fail, fallback on atomic copy
        with open(src, 'rb') as srcf:
            with util.atomictempfile(dest) as dstf:
                for chunk in util.filechunkiter(srcf):
                    dstf.write(chunk)
        os.chmod(dest, os.stat(src).st_mode)

def usercachepath(ui, hash):
    '''Return the correct location in the "global" largefiles cache for a file
    with the given hash.
    This cache is used for sharing of largefiles across repositories - both
    to preserve download bandwidth and storage space.'''
    return os.path.join(_usercachedir(ui), hash)

def _usercachedir(ui):
    '''Return the location of the "global" largefiles cache.'''
    path = ui.configpath(longname, 'usercache', None)
    if path:
        return path
    if pycompat.osname == 'nt':
        appdata = encoding.environ.get('LOCALAPPDATA',\
                encoding.environ.get('APPDATA'))
        if appdata:
            return os.path.join(appdata, longname)
    elif platform.system() == 'Darwin':
        home = encoding.environ.get('HOME')
        if home:
            return os.path.join(home, 'Library', 'Caches', longname)
    elif pycompat.osname == 'posix':
        path = encoding.environ.get('XDG_CACHE_HOME')
        if path:
            return os.path.join(path, longname)
        home = encoding.environ.get('HOME')
        if home:
            return os.path.join(home, '.cache', longname)
    else:
        raise error.Abort(_('unknown operating system: %s\n')
                          % pycompat.osname)
    raise error.Abort(_('unknown %s usercache location') % longname)

def inusercache(ui, hash):
    path = usercachepath(ui, hash)
    return os.path.exists(path)

def findfile(repo, hash):
    '''Return store path of the largefile with the specified hash.
    As a side effect, the file might be linked from user cache.
    Return None if the file can't be found locally.'''
    path, exists = findstorepath(repo, hash)
    if exists:
        repo.ui.note(_('found %s in store\n') % hash)
        return path
    elif inusercache(repo.ui, hash):
        repo.ui.note(_('found %s in system cache\n') % hash)
        path = storepath(repo, hash)
        link(usercachepath(repo.ui, hash), path)
        return path
    return None

class largefilesdirstate(dirstate.dirstate):
    def __getitem__(self, key):
        return super(largefilesdirstate, self).__getitem__(unixpath(key))
    def normal(self, f):
        return super(largefilesdirstate, self).normal(unixpath(f))
    def remove(self, f):
        return super(largefilesdirstate, self).remove(unixpath(f))
    def add(self, f):
        return super(largefilesdirstate, self).add(unixpath(f))
    def drop(self, f):
        return super(largefilesdirstate, self).drop(unixpath(f))
    def forget(self, f):
        return super(largefilesdirstate, self).forget(unixpath(f))
    def normallookup(self, f):
        return super(largefilesdirstate, self).normallookup(unixpath(f))
    def _ignore(self, f):
        return False
    def write(self, tr=False):
        # (1) disable PENDING mode always
        #     (lfdirstate isn't yet managed as a part of the transaction)
        # (2) avoid develwarn 'use dirstate.write with ....'
        super(largefilesdirstate, self).write(None)

def openlfdirstate(ui, repo, create=True):
    '''
    Return a dirstate object that tracks largefiles: i.e. its root is
    the repo root, but it is saved in .hg/largefiles/dirstate.
    '''
    vfs = repo.vfs
    lfstoredir = longname
    opener = vfsmod.vfs(vfs.join(lfstoredir))
    lfdirstate = largefilesdirstate(opener, ui, repo.root,
                                    repo.dirstate._validate)

    # If the largefiles dirstate does not exist, populate and create
    # it. This ensures that we create it on the first meaningful
    # largefiles operation in a new clone.
    if create and not vfs.exists(vfs.join(lfstoredir, 'dirstate')):
        matcher = getstandinmatcher(repo)
        standins = repo.dirstate.walk(matcher, [], False, False)

        if len(standins) > 0:
            vfs.makedirs(lfstoredir)

        for standin in standins:
            lfile = splitstandin(standin)
            lfdirstate.normallookup(lfile)
    return lfdirstate

def lfdirstatestatus(lfdirstate, repo):
    pctx = repo['.']
    match = matchmod.always(repo.root, repo.getcwd())
    unsure, s = lfdirstate.status(match, [], False, False, False)
    modified, clean = s.modified, s.clean
    for lfile in unsure:
        try:
            fctx = pctx[standin(lfile)]
        except LookupError:
            fctx = None
        if not fctx or fctx.data().strip() != hashfile(repo.wjoin(lfile)):
            modified.append(lfile)
        else:
            clean.append(lfile)
            lfdirstate.normal(lfile)
    return s

def listlfiles(repo, rev=None, matcher=None):
    '''return a list of largefiles in the working copy or the
    specified changeset'''

    if matcher is None:
        matcher = getstandinmatcher(repo)

    # ignore unknown files in working directory
    return [splitstandin(f)
            for f in repo[rev].walk(matcher)
            if rev is not None or repo.dirstate[f] != '?']

def instore(repo, hash, forcelocal=False):
    '''Return true if a largefile with the given hash exists in the store'''
    return os.path.exists(storepath(repo, hash, forcelocal))

def storepath(repo, hash, forcelocal=False):
    '''Return the correct location in the repository largefiles store for a
    file with the given hash.'''
    if not forcelocal and repo.shared():
        return repo.vfs.reljoin(repo.sharedpath, longname, hash)
    return repo.vfs.join(longname, hash)

def findstorepath(repo, hash):
    '''Search through the local store path(s) to find the file for the given
    hash.  If the file is not found, its path in the primary store is returned.
    The return value is a tuple of (path, exists(path)).
    '''
    # For shared repos, the primary store is in the share source.  But for
    # backward compatibility, force a lookup in the local store if it wasn't
    # found in the share source.
    path = storepath(repo, hash, False)

    if instore(repo, hash):
        return (path, True)
    elif repo.shared() and instore(repo, hash, True):
        return storepath(repo, hash, True), True

    return (path, False)

def copyfromcache(repo, hash, filename):
    '''Copy the specified largefile from the repo or system cache to
    filename in the repository. Return true on success or false if the
    file was not found in either cache (which should not happened:
    this is meant to be called only after ensuring that the needed
    largefile exists in the cache).'''
    wvfs = repo.wvfs
    path = findfile(repo, hash)
    if path is None:
        return False
    wvfs.makedirs(wvfs.dirname(wvfs.join(filename)))
    # The write may fail before the file is fully written, but we
    # don't use atomic writes in the working copy.
    with open(path, 'rb') as srcfd:
        with wvfs(filename, 'wb') as destfd:
            gothash = copyandhash(
                util.filechunkiter(srcfd), destfd)
    if gothash != hash:
        repo.ui.warn(_('%s: data corruption in %s with hash %s\n')
                     % (filename, path, gothash))
        wvfs.unlink(filename)
        return False
    return True

def copytostore(repo, revorctx, file, uploaded=False):
    wvfs = repo.wvfs
    hash = readstandin(repo, file, revorctx)
    if instore(repo, hash):
        return
    if wvfs.exists(file):
        copytostoreabsolute(repo, wvfs.join(file), hash)
    else:
        repo.ui.warn(_("%s: largefile %s not available from local store\n") %
                     (file, hash))

def copyalltostore(repo, node):
    '''Copy all largefiles in a given revision to the store'''

    ctx = repo[node]
    for filename in ctx.files():
        realfile = splitstandin(filename)
        if realfile is not None and filename in ctx.manifest():
            copytostore(repo, ctx, realfile)

def copytostoreabsolute(repo, file, hash):
    if inusercache(repo.ui, hash):
        link(usercachepath(repo.ui, hash), storepath(repo, hash))
    else:
        util.makedirs(os.path.dirname(storepath(repo, hash)))
        with open(file, 'rb') as srcf:
            with util.atomictempfile(storepath(repo, hash),
                                     createmode=repo.store.createmode) as dstf:
                for chunk in util.filechunkiter(srcf):
                    dstf.write(chunk)
        linktousercache(repo, hash)

def linktousercache(repo, hash):
    '''Link / copy the largefile with the specified hash from the store
    to the cache.'''
    path = usercachepath(repo.ui, hash)
    link(storepath(repo, hash), path)

def getstandinmatcher(repo, rmatcher=None):
    '''Return a match object that applies rmatcher to the standin directory'''
    wvfs = repo.wvfs
    standindir = shortname

    # no warnings about missing files or directories
    badfn = lambda f, msg: None

    if rmatcher and not rmatcher.always():
        pats = [wvfs.join(standindir, pat) for pat in rmatcher.files()]
        if not pats:
            pats = [wvfs.join(standindir)]
        match = scmutil.match(repo[None], pats, badfn=badfn)
        # if pats is empty, it would incorrectly always match, so clear _always
        match._always = False
    else:
        # no patterns: relative to repo root
        match = scmutil.match(repo[None], [wvfs.join(standindir)], badfn=badfn)
    return match

def composestandinmatcher(repo, rmatcher):
    '''Return a matcher that accepts standins corresponding to the
    files accepted by rmatcher. Pass the list of files in the matcher
    as the paths specified by the user.'''
    smatcher = getstandinmatcher(repo, rmatcher)
    isstandin = smatcher.matchfn
    def composedmatchfn(f):
        return isstandin(f) and rmatcher.matchfn(splitstandin(f))
    smatcher.matchfn = composedmatchfn

    return smatcher

def standin(filename):
    '''Return the repo-relative path to the standin for the specified big
    file.'''
    # Notes:
    # 1) Some callers want an absolute path, but for instance addlargefiles
    #    needs it repo-relative so it can be passed to repo[None].add().  So
    #    leave it up to the caller to use repo.wjoin() to get an absolute path.
    # 2) Join with '/' because that's what dirstate always uses, even on
    #    Windows. Change existing separator to '/' first in case we are
    #    passed filenames from an external source (like the command line).
    return shortnameslash + util.pconvert(filename)

def isstandin(filename):
    '''Return true if filename is a big file standin. filename must be
    in Mercurial's internal form (slash-separated).'''
    return filename.startswith(shortnameslash)

def splitstandin(filename):
    # Split on / because that's what dirstate always uses, even on Windows.
    # Change local separator to / first just in case we are passed filenames
    # from an external source (like the command line).
    bits = util.pconvert(filename).split('/', 1)
    if len(bits) == 2 and bits[0] == shortname:
        return bits[1]
    else:
        return None

def updatestandin(repo, lfile, standin):
    """Re-calculate hash value of lfile and write it into standin

    This assumes that "lfutil.standin(lfile) == standin", for efficiency.
    """
    file = repo.wjoin(lfile)
    if repo.wvfs.exists(lfile):
        hash = hashfile(file)
        executable = getexecutable(file)
        writestandin(repo, standin, hash, executable)
    else:
        raise error.Abort(_('%s: file not found!') % lfile)

+def readasstandin(fctx):
+    '''read hex hash from given filectx of standin file
+
+    This encapsulates how "standin" data is stored into storage layer.'''
+    return fctx.data().strip()
+
def readstandin(repo, filename, node=None):
    '''read hex hash from standin for filename at given node, or working
    directory if no node is given'''
-    return repo[node][standin(filename)].data().strip()
+    return readasstandin(repo[node][standin(filename)])

def writestandin(repo, standin, hash, executable):
    '''write hash to <repo.root>/<standin>'''
    repo.wwrite(standin, hash + '\n', executable and 'x' or '')

def copyandhash(instream, outfile):
    '''Read bytes from instream (iterable) and write them to outfile,
    computing the SHA-1 hash of the data along the way. Return the hash.'''
    hasher = hashlib.sha1('')
    for data in instream:
        hasher.update(data)
        outfile.write(data)
    return hasher.hexdigest()

def hashfile(file):
    if not os.path.exists(file):
        return ''
    with open(file, 'rb') as fd:
        return hexsha1(fd)

def getexecutable(filename):
    mode = os.stat(filename).st_mode
    return ((mode & stat.S_IXUSR) and
            (mode & stat.S_IXGRP) and
            (mode & stat.S_IXOTH))

def urljoin(first, second, *arg):
    def join(left, right):
        if not left.endswith('/'):
            left += '/'
        if right.startswith('/'):
            right = right[1:]
        return left + right

    url = join(first, second)
    for a in arg:
        url = join(url, a)
    return url

def hexsha1(fileobj):
    """hexsha1 returns the hex-encoded sha1 sum of the data in the file-like
    object data"""
    h = hashlib.sha1()
    for chunk in util.filechunkiter(fileobj):
        h.update(chunk)
    return h.hexdigest()

def httpsendfile(ui, filename):
    return httpconnection.httpsendfile(ui, filename, 'rb')

def unixpath(path):
    '''Return a version of path normalized for use with the lfdirstate.'''
    return util.pconvert(os.path.normpath(path))

def islfilesrepo(repo):
    '''Return true if the repo is a largefile repo.'''
    if ('largefiles' in repo.requirements and
        any(shortnameslash in f[0] for f in repo.store.datafiles())):
        return True

    return any(openlfdirstate(repo.ui, repo, False))

class storeprotonotcapable(Exception):
    def __init__(self, storetypes):
        self.storetypes = storetypes

def getstandinsstate(repo):
    standins = []
    matcher = getstandinmatcher(repo)
    for standin in repo.dirstate.walk(matcher, [], False, False):
        lfile = splitstandin(standin)
        try:
            hash = readstandin(repo, lfile)
        except IOError:
            hash = None
        standins.append((lfile, hash))
    return standins

def synclfdirstate(repo, lfdirstate, lfile, normallookup):
    lfstandin = standin(lfile)
    if lfstandin in repo.dirstate:
        stat = repo.dirstate._map[lfstandin]
        state, mtime = stat[0], stat[3]
    else:
        state, mtime = '?', -1
    if state == 'n':
        if (normallookup or mtime < 0 or
                not repo.wvfs.exists(lfile)):
            # state 'n' doesn't ensure 'clean' in this case
            lfdirstate.normallookup(lfile)
        else:
            lfdirstate.normal(lfile)
    elif state == 'm':
        lfdirstate.normallookup(lfile)
    elif state == 'r':
        lfdirstate.remove(lfile)
    elif state == 'a':
        lfdirstate.add(lfile)
    elif state == '?':
        lfdirstate.drop(lfile)

def markcommitted(orig, ctx, node):
    repo = ctx.repo()

    orig(node)

    # ATTENTION: "ctx.files()" may differ from "repo[node].files()"
    # because files coming from the 2nd parent are omitted in the latter.
    #
    # The former should be used to get targets of "synclfdirstate",
    # because such files:
    # - are marked as "a" by "patch.patch()" (e.g. via transplant), and
    # - have to be marked as "n" after commit, but
    # - aren't listed in "repo[node].files()"

    lfdirstate = openlfdirstate(repo.ui, repo)
    for f in ctx.files():
        lfile = splitstandin(f)
        if lfile is not None:
            synclfdirstate(repo, lfdirstate, lfile, False)
    lfdirstate.write()

    # As part of committing, copy all of the largefiles into the cache.
    #
    # Using "node" instead of "ctx" implies additional "repo[node]"
    # lookup while copyalltostore(), but can omit redundant check for
    # files comming from the 2nd parent, which should exist in store
    # at merging.
    copyalltostore(repo, node)

def getlfilestoupdate(oldstandins, newstandins):
    changedstandins = set(oldstandins).symmetric_difference(set(newstandins))
    filelist = []
    for f in changedstandins:
        if f[0] not in filelist:
            filelist.append(f[0])
    return filelist

def getlfilestoupload(repo, missing, addfunc):
    for i, n in enumerate(missing):
        repo.ui.progress(_('finding outgoing largefiles'), i,
                         unit=_('revisions'), total=len(missing))
        parents = [p for p in repo[n].parents() if p != node.nullid]

        oldlfstatus = repo.lfstatus
        repo.lfstatus = False
        try:
            ctx = repo[n]
        finally:
            repo.lfstatus = oldlfstatus

        files = set(ctx.files())
        if len(parents) == 2:
            mc = ctx.manifest()
            mp1 = ctx.parents()[0].manifest()
            mp2 = ctx.parents()[1].manifest()
            for f in mp1:
                if f not in mc:
                    files.add(f)
            for f in mp2:
                if f not in mc:
                    files.add(f)
            for f in mc:
                if mc[f] != mp1.get(f, None) or mc[f] != mp2.get(f, None):
                    files.add(f)
        for fn in files:
            if isstandin(fn) and fn in ctx:
                addfunc(fn, ctx[fn].data().strip())
    repo.ui.progress(_('finding outgoing largefiles'), None)

def updatestandinsbymatch(repo, match):
    '''Update standins in the working directory according to specified match

    This returns (possibly modified) ``match`` object to be used for
    subsequent commit process.
    '''

    ui = repo.ui

    # Case 1: user calls commit with no specific files or
    # include/exclude patterns: refresh and commit all files that
    # are "dirty".
    if match is None or match.always():
        # Spend a bit of time here to get a list of files we know
        # are modified so we can compare only against those.
        # It can cost a lot of time (several seconds)
        # otherwise to update all standins if the largefiles are
        # large.
        lfdirstate = openlfdirstate(ui, repo)
        dirtymatch = matchmod.always(repo.root, repo.getcwd())
        unsure, s = lfdirstate.status(dirtymatch, [], False, False,
                                      False)
        modifiedfiles = unsure + s.modified + s.added + s.removed
        lfiles = listlfiles(repo)
        # this only loops through largefiles that exist (not
        # removed/renamed)
        for lfile in lfiles:
            if lfile in modifiedfiles:
                fstandin = standin(lfile)
                if repo.wvfs.exists(fstandin):
                    # this handles the case where a rebase is being
                    # performed and the working copy is not updated
                    # yet.
                    if repo.wvfs.exists(lfile):
                        updatestandin(repo, lfile, fstandin)

        return match

    lfiles = listlfiles(repo)
    match._files = repo._subdirlfs(match.files(), lfiles)

    # Case 2: user calls commit with specified patterns: refresh
    # any matching big files.
    smatcher = composestandinmatcher(repo, match)
    standins = repo.dirstate.walk(smatcher, [], False, False)

    # No matching big files: get out of the way and pass control to
    # the usual commit() method.
    if not standins:
        return match

    # Refresh all matching big files.  It's possible that the
    # commit will end up failing, in which case the big files will
    # stay refreshed.  No harm done: the user modified them and
    # asked to commit them, so sooner or later we're going to
    # refresh the standins.  Might as well leave them refreshed.
    lfdirstate = openlfdirstate(ui, repo)
    for fstandin in standins:
        lfile = splitstandin(fstandin)
        if lfdirstate[lfile] != 'r':
            updatestandin(repo, lfile, fstandin)

    # Cook up a new matcher that only matches regular files or
    # standins corresponding to the big files requested by the
    # user.  Have to modify _files to prevent commit() from
    # complaining "not tracked" for big files.
    match = copy.copy(match)
    origmatchfn = match.matchfn

    # Check both the list of largefiles and the list of
    # standins because if a largefile was removed, it
    # won't be in the list of largefiles at this point
    match._files += sorted(standins)

    actualfiles = []
    for f in match._files:
        fstandin = standin(f)

        # For largefiles, only one of the normal and standin should be
        # committed (except if one of them is a remove).  In the case of a
        # standin removal, drop the normal file if it is unknown to dirstate.
        # Thus, skip plain largefile names but keep the standin.
        if f in lfiles or fstandin in standins:
            if repo.dirstate[fstandin] != 'r':
                if repo.dirstate[f] != 'r':
                    continue
            elif repo.dirstate[f] == '?':
                continue

        actualfiles.append(f)
    match._files = actualfiles

    def matchfn(f):
        if origmatchfn(f):
            return f not in lfiles
        else:
            return f in standins

    match.matchfn = matchfn

    return match

class automatedcommithook(object):
    '''Stateful hook to update standins at the 1st commit of resuming

    For efficiency, updating standins in the working directory should
    be avoided while automated committing (like rebase, transplant and
    so on), because they should be updated before committing.

    But the 1st commit of resuming automated committing (e.g. ``rebase
    --continue``) should update them, because largefiles may be
    modified manually.
    '''
    def __init__(self, resuming):
        self.resuming = resuming

    def __call__(self, repo, match):
        if self.resuming:
            self.resuming = False # avoids updating at subsequent commits
            return updatestandinsbymatch(repo, match)
        else:
            return match

def getstatuswriter(ui, repo, forcibly=None):
    '''Return the function to write largefiles specific status out

    If ``forcibly`` is ``None``, this returns the last element of
    ``repo._lfstatuswriters`` as "default" writer function.

    Otherwise, this returns the function to always write out (or
    ignore if ``not forcibly``) status.
    '''
    if forcibly is None and util.safehasattr(repo, '_largefilesenabled'):
        return repo._lfstatuswriters[-1]
    else:
        if forcibly:
            return ui.status # forcibly WRITE OUT
        else:
            return lambda *msg, **opts: None # forcibly IGNORE