largefiles: copy files in binary mode (issue3164)
Matt Mackall
r15699:84e55467 (stable)
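Both chunked-copy call sites in the largefiles utility module (lfutil.py) opened the source file with a bare open(), which defaults to text mode. On Windows, text-mode reads translate '\r\n' into '\n' and treat a 0x1A (Ctrl-Z) byte as end of file, so copying a binary largefile that way can silently corrupt or truncate it; on POSIX systems the two modes behave identically, which is why the bug went unnoticed there. The fix passes 'rb' at both sites: in link(), the atomic-copy fallback used when hardlinking fails, and in copytostoreabsolute(), which copies a largefile into the store. A minimal sketch of the binary-safe chunked-copy pattern, with plain files standing in for the util.filechunkiter/util.atomictempfile pair the real code uses:

    # Sketch only: the real code streams util.filechunkiter(open(src, 'rb'))
    # into util.atomictempfile(dest); plain files keep this self-contained.
    def copychunks(src, dest, blocksize=128 * 1024):
        fsrc = open(src, 'rb')    # 'rb' is the whole fix: text mode on
        fdst = open(dest, 'wb')   # Windows mangles \r\n and stops at ^Z
        try:
            while True:
                chunk = fsrc.read(blocksize)
                if not chunk:
                    break
                fdst.write(chunk)
        finally:
            fsrc.close()
            fdst.close()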
@@ -1,469 +1,469 @@
 # Copyright 2009-2010 Gregory P. Ward
 # Copyright 2009-2010 Intelerad Medical Systems Incorporated
 # Copyright 2010-2011 Fog Creek Software
 # Copyright 2010-2011 Unity Technologies
 #
 # This software may be used and distributed according to the terms of the
 # GNU General Public License version 2 or any later version.
 
 '''largefiles utility code: must not import other modules in this package.'''
 
 import os
 import errno
 import platform
 import shutil
 import stat
 import tempfile
 
 from mercurial import dirstate, httpconnection, match as match_, util, scmutil
 from mercurial.i18n import _
 
 shortname = '.hglf'
 longname = 'largefiles'
 
 
 # -- Portability wrappers ----------------------------------------------
 
 def dirstate_walk(dirstate, matcher, unknown=False, ignored=False):
     return dirstate.walk(matcher, [], unknown, ignored)
 
 def repo_add(repo, list):
     add = repo[None].add
     return add(list)
 
 def repo_remove(repo, list, unlink=False):
     def remove(list, unlink):
         wlock = repo.wlock()
         try:
             if unlink:
                 for f in list:
                     try:
                         util.unlinkpath(repo.wjoin(f))
                     except OSError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
             repo[None].forget(list)
         finally:
             wlock.release()
     return remove(list, unlink=unlink)
 
 def repo_forget(repo, list):
     forget = repo[None].forget
     return forget(list)
 
 def findoutgoing(repo, remote, force):
     from mercurial import discovery
     common, _anyinc, _heads = discovery.findcommonincoming(repo,
         remote, force=force)
     return repo.changelog.findmissing(common)
 
 # -- Private worker functions ------------------------------------------
 
 def getminsize(ui, assumelfiles, opt, default=10):
     lfsize = opt
     if not lfsize and assumelfiles:
         lfsize = ui.config(longname, 'minsize', default=default)
     if lfsize:
         try:
             lfsize = float(lfsize)
         except ValueError:
             raise util.Abort(_('largefiles: size must be number (not %s)\n')
                              % lfsize)
     if lfsize is None:
         raise util.Abort(_('minimum size for largefiles must be specified'))
     return lfsize
 
 def link(src, dest):
     try:
         util.oslink(src, dest)
     except OSError:
         # if hardlinks fail, fallback on atomic copy
         dst = util.atomictempfile(dest)
-        for chunk in util.filechunkiter(open(src)):
+        for chunk in util.filechunkiter(open(src, 'rb')):
             dst.write(chunk)
         dst.close()
         os.chmod(dest, os.stat(src).st_mode)
 
 def usercachepath(ui, hash):
     path = ui.configpath(longname, 'usercache', None)
     if path:
         path = os.path.join(path, hash)
     else:
         if os.name == 'nt':
             appdata = os.getenv('LOCALAPPDATA', os.getenv('APPDATA'))
             if appdata:
                 path = os.path.join(appdata, longname, hash)
         elif platform.system() == 'Darwin':
             home = os.getenv('HOME')
             if home:
                 path = os.path.join(home, 'Library', 'Caches',
                                     longname, hash)
         elif os.name == 'posix':
             path = os.getenv('XDG_CACHE_HOME')
             if path:
                 path = os.path.join(path, longname, hash)
             else:
                 home = os.getenv('HOME')
                 if home:
                     path = os.path.join(home, '.cache', longname, hash)
         else:
             raise util.Abort(_('unknown operating system: %s\n') % os.name)
     return path
 
 def inusercache(ui, hash):
     path = usercachepath(ui, hash)
     return path and os.path.exists(path)
 
 def findfile(repo, hash):
     if instore(repo, hash):
         repo.ui.note(_('Found %s in store\n') % hash)
     elif inusercache(repo.ui, hash):
         repo.ui.note(_('Found %s in system cache\n') % hash)
         path = storepath(repo, hash)
         util.makedirs(os.path.dirname(path))
         link(usercachepath(repo.ui, hash), path)
     else:
         return None
     return storepath(repo, hash)
 
 class largefiles_dirstate(dirstate.dirstate):
     def __getitem__(self, key):
         return super(largefiles_dirstate, self).__getitem__(unixpath(key))
     def normal(self, f):
         return super(largefiles_dirstate, self).normal(unixpath(f))
     def remove(self, f):
         return super(largefiles_dirstate, self).remove(unixpath(f))
     def add(self, f):
         return super(largefiles_dirstate, self).add(unixpath(f))
     def drop(self, f):
         return super(largefiles_dirstate, self).drop(unixpath(f))
     def forget(self, f):
         return super(largefiles_dirstate, self).forget(unixpath(f))
 
 def openlfdirstate(ui, repo):
     '''
     Return a dirstate object that tracks largefiles: i.e. its root is
     the repo root, but it is saved in .hg/largefiles/dirstate.
     '''
     admin = repo.join(longname)
     opener = scmutil.opener(admin)
     lfdirstate = largefiles_dirstate(opener, ui, repo.root,
                                      repo.dirstate._validate)
 
     # If the largefiles dirstate does not exist, populate and create
     # it. This ensures that we create it on the first meaningful
     # largefiles operation in a new clone. It also gives us an easy
     # way to forcibly rebuild largefiles state:
     #   rm .hg/largefiles/dirstate && hg status
     # Or even, if things are really messed up:
     #   rm -rf .hg/largefiles && hg status
     if not os.path.exists(os.path.join(admin, 'dirstate')):
         util.makedirs(admin)
         matcher = getstandinmatcher(repo)
         for standin in dirstate_walk(repo.dirstate, matcher):
             lfile = splitstandin(standin)
             hash = readstandin(repo, lfile)
             lfdirstate.normallookup(lfile)
             try:
                 if hash == hashfile(repo.wjoin(lfile)):
                     lfdirstate.normal(lfile)
             except OSError, err:
                 if err.errno != errno.ENOENT:
                     raise
 
         lfdirstate.write()
 
     return lfdirstate
 
 def lfdirstate_status(lfdirstate, repo, rev):
     wlock = repo.wlock()
     try:
         match = match_.always(repo.root, repo.getcwd())
         s = lfdirstate.status(match, [], False, False, False)
         unsure, modified, added, removed, missing, unknown, ignored, clean = s
         for lfile in unsure:
             if repo[rev][standin(lfile)].data().strip() != \
                     hashfile(repo.wjoin(lfile)):
                 modified.append(lfile)
             else:
                 clean.append(lfile)
                 lfdirstate.normal(lfile)
         lfdirstate.write()
     finally:
         wlock.release()
     return (modified, added, removed, missing, unknown, ignored, clean)
 
 def listlfiles(repo, rev=None, matcher=None):
     '''return a list of largefiles in the working copy or the
     specified changeset'''
 
     if matcher is None:
         matcher = getstandinmatcher(repo)
 
     # ignore unknown files in working directory
     return [splitstandin(f)
             for f in repo[rev].walk(matcher)
             if rev is not None or repo.dirstate[f] != '?']
 
 def instore(repo, hash):
     return os.path.exists(storepath(repo, hash))
 
 def storepath(repo, hash):
     return repo.join(os.path.join(longname, hash))
 
 def copyfromcache(repo, hash, filename):
     '''Copy the specified largefile from the repo or system cache to
     filename in the repository. Return true on success or false if the
     file was not found in either cache (which should not happened:
     this is meant to be called only after ensuring that the needed
     largefile exists in the cache).'''
     path = findfile(repo, hash)
     if path is None:
         return False
     util.makedirs(os.path.dirname(repo.wjoin(filename)))
     # The write may fail before the file is fully written, but we
     # don't use atomic writes in the working copy.
     shutil.copy(path, repo.wjoin(filename))
     return True
 
 def copytostore(repo, rev, file, uploaded=False):
     hash = readstandin(repo, file)
     if instore(repo, hash):
         return
     copytostoreabsolute(repo, repo.wjoin(file), hash)
 
 def copytostoreabsolute(repo, file, hash):
     util.makedirs(os.path.dirname(storepath(repo, hash)))
     if inusercache(repo.ui, hash):
         link(usercachepath(repo.ui, hash), storepath(repo, hash))
     else:
         dst = util.atomictempfile(storepath(repo, hash))
-        for chunk in util.filechunkiter(open(file)):
+        for chunk in util.filechunkiter(open(file, 'rb')):
             dst.write(chunk)
         dst.close()
         util.copymode(file, storepath(repo, hash))
     linktousercache(repo, hash)
 
 def linktousercache(repo, hash):
     path = usercachepath(repo.ui, hash)
     if path:
         util.makedirs(os.path.dirname(path))
         link(storepath(repo, hash), path)
 
 def getstandinmatcher(repo, pats=[], opts={}):
     '''Return a match object that applies pats to the standin directory'''
     standindir = repo.pathto(shortname)
     if pats:
         # patterns supplied: search standin directory relative to current dir
         cwd = repo.getcwd()
         if os.path.isabs(cwd):
             # cwd is an absolute path for hg -R <reponame>
             # work relative to the repository root in this case
             cwd = ''
         pats = [os.path.join(standindir, cwd, pat) for pat in pats]
     elif os.path.isdir(standindir):
         # no patterns: relative to repo root
         pats = [standindir]
     else:
         # no patterns and no standin dir: return matcher that matches nothing
         match = match_.match(repo.root, None, [], exact=True)
         match.matchfn = lambda f: False
         return match
     return getmatcher(repo, pats, opts, showbad=False)
 
 def getmatcher(repo, pats=[], opts={}, showbad=True):
     '''Wrapper around scmutil.match() that adds showbad: if false,
     neuter the match object's bad() method so it does not print any
     warnings about missing files or directories.'''
     match = scmutil.match(repo[None], pats, opts)
 
     if not showbad:
         match.bad = lambda f, msg: None
     return match
 
 def composestandinmatcher(repo, rmatcher):
     '''Return a matcher that accepts standins corresponding to the
     files accepted by rmatcher. Pass the list of files in the matcher
     as the paths specified by the user.'''
     smatcher = getstandinmatcher(repo, rmatcher.files())
     isstandin = smatcher.matchfn
     def composed_matchfn(f):
         return isstandin(f) and rmatcher.matchfn(splitstandin(f))
     smatcher.matchfn = composed_matchfn
 
     return smatcher
 
 def standin(filename):
     '''Return the repo-relative path to the standin for the specified big
     file.'''
     # Notes:
     # 1) Most callers want an absolute path, but _create_standin() needs
     #    it repo-relative so lfadd() can pass it to repo_add(). So leave
     #    it up to the caller to use repo.wjoin() to get an absolute path.
     # 2) Join with '/' because that's what dirstate always uses, even on
     #    Windows. Change existing separator to '/' first in case we are
     #    passed filenames from an external source (like the command line).
     return shortname + '/' + filename.replace(os.sep, '/')
 
 def isstandin(filename):
     '''Return true if filename is a big file standin. filename must be
     in Mercurial's internal form (slash-separated).'''
     return filename.startswith(shortname + '/')
 
 def splitstandin(filename):
     # Split on / because that's what dirstate always uses, even on Windows.
     # Change local separator to / first just in case we are passed filenames
     # from an external source (like the command line).
     bits = filename.replace(os.sep, '/').split('/', 1)
     if len(bits) == 2 and bits[0] == shortname:
         return bits[1]
     else:
         return None
 
 def updatestandin(repo, standin):
     file = repo.wjoin(splitstandin(standin))
     if os.path.exists(file):
         hash = hashfile(file)
         executable = getexecutable(file)
         writestandin(repo, standin, hash, executable)
 
 def readstandin(repo, filename, node=None):
     '''read hex hash from standin for filename at given node, or working
     directory if no node is given'''
     return repo[node][standin(filename)].data().strip()
 
 def writestandin(repo, standin, hash, executable):
     '''write hash to <repo.root>/<standin>'''
     writehash(hash, repo.wjoin(standin), executable)
 
 def copyandhash(instream, outfile):
     '''Read bytes from instream (iterable) and write them to outfile,
     computing the SHA-1 hash of the data along the way. Close outfile
     when done and return the binary hash.'''
     hasher = util.sha1('')
     for data in instream:
         hasher.update(data)
         outfile.write(data)
 
     # Blecch: closing a file that somebody else opened is rude and
     # wrong. But it's so darn convenient and practical! After all,
     # outfile was opened just to copy and hash.
     outfile.close()
 
     return hasher.digest()
 
 def hashrepofile(repo, file):
     return hashfile(repo.wjoin(file))
 
 def hashfile(file):
     if not os.path.exists(file):
         return ''
     hasher = util.sha1('')
     fd = open(file, 'rb')
     for data in blockstream(fd):
         hasher.update(data)
     fd.close()
     return hasher.hexdigest()
 
 class limitreader(object):
     def __init__(self, f, limit):
         self.f = f
         self.limit = limit
 
     def read(self, length):
         if self.limit == 0:
             return ''
         length = length > self.limit and self.limit or length
         self.limit -= length
         return self.f.read(length)
 
     def close(self):
         pass
 
 def blockstream(infile, blocksize=128 * 1024):
     """Generator that yields blocks of data from infile and closes infile."""
     while True:
         data = infile.read(blocksize)
         if not data:
             break
         yield data
     # same blecch as copyandhash() above
     infile.close()
 
 def readhash(filename):
     rfile = open(filename, 'rb')
     hash = rfile.read(40)
     rfile.close()
     if len(hash) < 40:
         raise util.Abort(_('bad hash in \'%s\' (only %d bytes long)')
                          % (filename, len(hash)))
     return hash
 
 def writehash(hash, filename, executable):
     util.makedirs(os.path.dirname(filename))
     if os.path.exists(filename):
         os.unlink(filename)
     wfile = open(filename, 'wb')
 
     try:
         wfile.write(hash)
         wfile.write('\n')
     finally:
         wfile.close()
     if os.path.exists(filename):
         os.chmod(filename, getmode(executable))
 
 def getexecutable(filename):
     mode = os.stat(filename).st_mode
     return ((mode & stat.S_IXUSR) and
             (mode & stat.S_IXGRP) and
             (mode & stat.S_IXOTH))
 
 def getmode(executable):
     if executable:
         return 0755
     else:
         return 0644
 
 def urljoin(first, second, *arg):
     def join(left, right):
         if not left.endswith('/'):
             left += '/'
         if right.startswith('/'):
             right = right[1:]
         return left + right
 
     url = join(first, second)
     for a in arg:
         url = join(url, a)
     return url
 
 def hexsha1(data):
     """hexsha1 returns the hex-encoded sha1 sum of the data in the file-like
     object data"""
     h = util.sha1()
     for chunk in util.filechunkiter(data):
         h.update(chunk)
     return h.hexdigest()
 
 def httpsendfile(ui, filename):
     return httpconnection.httpsendfile(ui, filename, 'rb')
 
 def unixpath(path):
     '''Return a version of path normalized for use with the lfdirstate.'''
     return os.path.normpath(path).replace(os.sep, '/')
 
 def islfilesrepo(repo):
     return ('largefiles' in repo.requirements and
             util.any(shortname + '/' in f[0] for f in repo.store.datafiles()))
 
 def mkstemp(repo, prefix):
     '''Returns a file descriptor and a filename corresponding to a temporary
     file in the repo's largefiles store.'''
     path = repo.join(longname)
     util.makedirs(path)
     return tempfile.mkstemp(prefix=prefix, dir=path)
 
 class storeprotonotcapable(Exception):
     def __init__(self, storetypes):
         self.storetypes = storetypes
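For reference, a standalone demonstration (not part of the commit) of the failure mode that 'rb' guards against. The corruption only shows up on Windows, where the C runtime distinguishes text mode from binary mode; on POSIX both opens behave identically:

    # Write a payload containing a ^Z byte and a CRLF pair, then read it
    # back both ways. On Windows the text-mode read stops at the ^Z and
    # rewrites line endings; the binary-mode read returns every byte.
    import tempfile

    payload = 'before\x1aafter\r\nend'
    tmp = tempfile.NamedTemporaryFile(delete=False)
    tmp.write(payload)
    tmp.close()

    f = open(tmp.name, 'rb')
    binary = f.read()               # intact on every platform
    f.close()
    f = open(tmp.name, 'r')
    text = f.read()                 # on Windows: 'before', truncated at ^Z
    f.close()

    assert binary == payload
    print repr(binary), repr(text)  # differ on Windows, equal on POSIX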