upstream/mercurial-mirror Commit - r41286:8a699551

1

from __future__ import absolute_import

1

from __future__ import absolute_import

2

3

import errno

3

import errno

4

import hashlib

4

import hashlib

5

import os

5

import os

6

import shutil

6

import shutil

7

import stat

7

import stat

8

import time

8

import time

9

10

from mercurial.i18n import _

10

from mercurial.i18n import _

11

from mercurial.node import bin, hex

11

from mercurial.node import bin, hex

12

from mercurial import (

12

from mercurial import (

13

error,

13

error,

14

pycompat,

14

pycompat,

15

util,

15

util,

16

)

16

)

17

from . import (

17

from . import (

18

constants,

18

constants,

19

shallowutil,

19

shallowutil,

20

)

20

)

21

22

class basestore(object):

22

class basestore(object):

23

def __init__(self, repo, path, reponame, shared=False):

23

def __init__(self, repo, path, reponame, shared=False):

24

"""Creates a remotefilelog store object for the given repo name.

24

"""Creates a remotefilelog store object for the given repo name.

25

26

`path` - The file path where this store keeps its data

26

`path` - The file path where this store keeps its data

27

`reponame` - The name of the repo. This is used to partition data from

27

`reponame` - The name of the repo. This is used to partition data from

28

many repos.

28

many repos.

29

`shared` - True if this store is a shared cache of data from the central

29

`shared` - True if this store is a shared cache of data from the central

30

server, for many repos on this machine. False means this store is for

30

server, for many repos on this machine. False means this store is for

31

the local data for one repo.

31

the local data for one repo.

32

"""

32

"""

33

self.repo = repo

33

self.repo = repo

34

self.ui = repo.ui

34

self.ui = repo.ui

35

self._path = path

35

self._path = path

36

self._reponame = reponame

36

self._reponame = reponame

37

self._shared = shared

37

self._shared = shared

38

self._uid = os.getuid() if not pycompat.iswindows else None

38

self._uid = os.getuid() if not pycompat.iswindows else None

39

40

self._validatecachelog = self.ui.config("remotefilelog",

40

self._validatecachelog = self.ui.config("remotefilelog",

41

"validatecachelog")

41

"validatecachelog")

42

self._validatecache = self.ui.config("remotefilelog", "validatecache",

42

self._validatecache = self.ui.config("remotefilelog", "validatecache",

43

'on')

43

'on')

44

if self._validatecache not in ('on', 'strict', 'off'):

44

if self._validatecache not in ('on', 'strict', 'off'):

45

self._validatecache = 'on'

45

self._validatecache = 'on'

46

if self._validatecache == 'off':

46

if self._validatecache == 'off':

47

self._validatecache = False

47

self._validatecache = False

48

49

if shared:

49

if shared:

50

shallowutil.mkstickygroupdir(self.ui, path)

50

shallowutil.mkstickygroupdir(self.ui, path)

51

52

def getmissing(self, keys):

52

def getmissing(self, keys):

53

missing = []

53

missing = []

54

for name, node in keys:

54

for name, node in keys:

55

filepath = self._getfilepath(name, node)

55

filepath = self._getfilepath(name, node)

56

exists = os.path.exists(filepath)

56

exists = os.path.exists(filepath)

57

if (exists and self._validatecache == 'strict' and

57

if (exists and self._validatecache == 'strict' and

58

not self._validatekey(filepath, 'contains')):

58

not self._validatekey(filepath, 'contains')):

59

exists = False

59

exists = False

60

if not exists:

60

if not exists:

61

missing.append((name, node))

61

missing.append((name, node))

62

63

return missing

63

return missing

64

65

# BELOW THIS ARE IMPLEMENTATIONS OF REPACK SOURCE

65

# BELOW THIS ARE IMPLEMENTATIONS OF REPACK SOURCE

66

67

def markledger(self, ledger, options=None):

67

def markledger(self, ledger, options=None):

68

if options and options.get(constants.OPTION_PACKSONLY):

68

if options and options.get(constants.OPTION_PACKSONLY):

69

return

69

return

70

if self._shared:

70

if self._shared:

71

for filename, nodes in self._getfiles():

71

for filename, nodes in self._getfiles():

72

for node in nodes:

72

for node in nodes:

73

ledger.markdataentry(self, filename, node)

73

ledger.markdataentry(self, filename, node)

74

ledger.markhistoryentry(self, filename, node)

74

ledger.markhistoryentry(self, filename, node)

75

76

def cleanup(self, ledger):

76

def cleanup(self, ledger):

77

ui = self.ui

77

ui = self.ui

78

entries = ledger.sources.get(self, [])

78

entries = ledger.sources.get(self, [])

79

count = 0

79

count = 0

80

progress = ui.makeprogress(_("cleaning up"), unit="files",

80

progress = ui.makeprogress(_("cleaning up"), unit="files",

81

total=len(entries))

81

total=len(entries))

82

for entry in entries:

82

for entry in entries:

83

if entry.gced or (entry.datarepacked and entry.historyrepacked):

83

if entry.gced or (entry.datarepacked and entry.historyrepacked):

84

progress.update(count)

84

progress.update(count)

85

path = self._getfilepath(entry.filename, entry.node)

85

path = self._getfilepath(entry.filename, entry.node)

86

util.tryunlink(path)

86

util.tryunlink(path)

87

count += 1

87

count += 1

88

progress.complete()

88

progress.complete()

89

90

# Clean up the repo cache directory.

90

# Clean up the repo cache directory.

91

self._cleanupdirectory(self._getrepocachepath())

91

self._cleanupdirectory(self._getrepocachepath())

92

93

# BELOW THIS ARE NON-STANDARD APIS

93

# BELOW THIS ARE NON-STANDARD APIS

94

95

def _cleanupdirectory(self, rootdir):

95

def _cleanupdirectory(self, rootdir):

96

"""Removes the empty directories and unnecessary files within the root

96

"""Removes the empty directories and unnecessary files within the root

97

directory recursively. Note that this method does not remove the root

97

directory recursively. Note that this method does not remove the root

98

directory itself. """

98

directory itself. """

99

100

oldfiles = set()

100

oldfiles = set()

101

otherfiles = set()

101

otherfiles = set()

102

# osutil.listdir returns stat information which saves some rmdir/listdir

102

# osutil.listdir returns stat information which saves some rmdir/listdir

103

# syscalls.

103

# syscalls.

104

for name, mode in util.osutil.listdir(rootdir):

104

for name, mode in util.osutil.listdir(rootdir):

105

if stat.S_ISDIR(mode):

105

if stat.S_ISDIR(mode):

106

dirpath = os.path.join(rootdir, name)

106

dirpath = os.path.join(rootdir, name)

107

self._cleanupdirectory(dirpath)

107

self._cleanupdirectory(dirpath)

108

109

# Now that the directory specified by dirpath is potentially

109

# Now that the directory specified by dirpath is potentially

110

# empty, try and remove it.

110

# empty, try and remove it.

111

try:

111

try:

112

os.rmdir(dirpath)

112

os.rmdir(dirpath)

113

except OSError:

113

except OSError:

114

pass

114

pass

115

116

elif stat.S_ISREG(mode):

116

elif stat.S_ISREG(mode):

117

if name.endswith('_old'):

117

if name.endswith('_old'):

118

oldfiles.add(name[:-4])

118

oldfiles.add(name[:-4])

119

else:

119

else:

120

otherfiles.add(name)

120

otherfiles.add(name)

121

122

# Remove the files which end with suffix '_old' and have no

122

# Remove the files which end with suffix '_old' and have no

123

# corresponding file without the suffix '_old'. See addremotefilelognode

123

# corresponding file without the suffix '_old'. See addremotefilelognode

124

# method for the generation/purpose of files with '_old' suffix.

124

# method for the generation/purpose of files with '_old' suffix.

125

for filename in oldfiles - otherfiles:

125

for filename in oldfiles - otherfiles:

126

filepath = os.path.join(rootdir, filename + '_old')

126

filepath = os.path.join(rootdir, filename + '_old')

127

util.tryunlink(filepath)

127

util.tryunlink(filepath)

128

129

def _getfiles(self):

129

def _getfiles(self):

130

"""Return a list of (filename, [node,...]) for all the revisions that

130

"""Return a list of (filename, [node,...]) for all the revisions that

131

exist in the store.

131

exist in the store.

132

133

This is useful for obtaining a list of all the contents of the store

133

This is useful for obtaining a list of all the contents of the store

134

when performing a repack to another store, since the store API requires

134

when performing a repack to another store, since the store API requires

135

name+node keys and not namehash+node keys.

135

name+node keys and not namehash+node keys.

136

"""

136

"""

137

existing = {}

137

existing = {}

138

for filenamehash, node in self._listkeys():

138

for filenamehash, node in self._listkeys():

139

existing.setdefault(filenamehash, []).append(node)

139

existing.setdefault(filenamehash, []).append(node)

140

141

filenamemap = self._resolvefilenames(existing.keys())

141

filenamemap = self._resolvefilenames(existing.keys())

142

143

for filename, sha in filenamemap.iteritems():

143

for filename, sha in filenamemap.iteritems():

144

yield (filename, existing[sha])

144

yield (filename, existing[sha])

145

146

def _resolvefilenames(self, hashes):

146

def _resolvefilenames(self, hashes):

147

"""Given a list of filename hashes that are present in the

147

"""Given a list of filename hashes that are present in the

148

remotefilelog store, return a mapping from filename->hash.

148

remotefilelog store, return a mapping from filename->hash.

149

150

This is useful when converting remotefilelog blobs into other storage

150

This is useful when converting remotefilelog blobs into other storage

151

formats.

151

formats.

152

"""

152

"""

153

if not hashes:

153

if not hashes:

154

return {}

154

return {}

155

156

filenames = {}

156

filenames = {}

157

missingfilename = set(hashes)

157

missingfilename = set(hashes)

158

159

# Start with a full manifest, since it'll cover the majority of files

159

# Start with a full manifest, since it'll cover the majority of files

160

for filename in self.repo['tip'].manifest():

160

for filename in self.repo['tip'].manifest():

161

sha = hashlib.sha1(filename).digest()

161

sha = hashlib.sha1(filename).digest()

162

if sha in missingfilename:

162

if sha in missingfilename:

163

filenames[filename] = sha

163

filenames[filename] = sha

164

missingfilename.discard(sha)

164

missingfilename.discard(sha)

165

166

# Scan the changelog until we've found every file name

166

# Scan the changelog until we've found every file name

167

cl = self.repo.unfiltered().changelog

167

cl = self.repo.unfiltered().changelog

168

for rev in pycompat.xrange(len(cl) - 1, -1, -1):

168

for rev in pycompat.xrange(len(cl) - 1, -1, -1):

169

if not missingfilename:

169

if not missingfilename:

170

break

170

break

171

files = cl.readfiles(cl.node(rev))

171

files = cl.readfiles(cl.node(rev))

172

for filename in files:

172

for filename in files:

173

sha = hashlib.sha1(filename).digest()

173

sha = hashlib.sha1(filename).digest()

174

if sha in missingfilename:

174

if sha in missingfilename:

175

filenames[filename] = sha

175

filenames[filename] = sha

176

missingfilename.discard(sha)

176

missingfilename.discard(sha)

177

178

return filenames

178

return filenames

179

180

def _getrepocachepath(self):

180

def _getrepocachepath(self):

181

return os.path.join(

181

return os.path.join(

182

self._path, self._reponame) if self._shared else self._path

182

self._path, self._reponame) if self._shared else self._path

183

184

def _listkeys(self):

184

def _listkeys(self):

185

"""List all the remotefilelog keys that exist in the store.

185

"""List all the remotefilelog keys that exist in the store.

186

187

Returns a iterator of (filename hash, filecontent hash) tuples.

187

Returns a iterator of (filename hash, filecontent hash) tuples.

188

"""

188

"""

189

190

for root, dirs, files in os.walk(self._getrepocachepath()):

190

for root, dirs, files in os.walk(self._getrepocachepath()):

191

for filename in files:

191

for filename in files:

192

if len(filename) != 40:

192

if len(filename) != 40:

193

continue

193

continue

194

node = filename

194

node = filename

195

if self._shared:

195

if self._shared:

196

# .../1a/85ffda..be21

196

# .../1a/85ffda..be21

197

filenamehash = root[-41:-39] + root[-38:]

197

filenamehash = root[-41:-39] + root[-38:]

198

else:

198

else:

199

filenamehash = root[-40:]

199

filenamehash = root[-40:]

200

yield (bin(filenamehash), bin(node))

200

yield (bin(filenamehash), bin(node))

201

202

def _getfilepath(self, name, node):

202

def _getfilepath(self, name, node):

203

node = hex(node)

203

node = hex(node)

204

if self._shared:

204

if self._shared:

205

key = shallowutil.getcachekey(self._reponame, name, node)

205

key = shallowutil.getcachekey(self._reponame, name, node)

206

else:

206

else:

207

key = shallowutil.getlocalkey(name, node)

207

key = shallowutil.getlocalkey(name, node)

208

209

return os.path.join(self._path, key)

209

return os.path.join(self._path, key)

210

211

def _getdata(self, name, node):

211

def _getdata(self, name, node):

212

filepath = self._getfilepath(name, node)

212

filepath = self._getfilepath(name, node)

213

try:

213

try:

214

data = shallowutil.readfile(filepath)

214

data = shallowutil.readfile(filepath)

215

if self._validatecache and not self._validatedata(data, filepath):

215

if self._validatecache and not self._validatedata(data, filepath):

216

if self._validatecachelog:

216

if self._validatecachelog:

217

with open(self._validatecachelog, 'a+') as f:

217

with open(self._validatecachelog, 'a+') as f:

218

f.write("corrupt %s during read\n" % filepath)

218

f.write("corrupt %s during read\n" % filepath)

219

os.rename(filepath, filepath + ".corrupt")

219

os.rename(filepath, filepath + ".corrupt")

220

raise KeyError("corrupt local cache file %s" % filepath)

220

raise KeyError("corrupt local cache file %s" % filepath)

221

except IOError:

221

except IOError:

222

raise KeyError("no file found at %s for %s:%s" % (filepath, name,

222

raise KeyError("no file found at %s for %s:%s" % (filepath, name,

223

hex(node)))

223

hex(node)))

224

225

return data

225

return data

226

227

def addremotefilelognode(self, name, node, data):

227

def addremotefilelognode(self, name, node, data):

228

filepath = self._getfilepath(name, node)

228

filepath = self._getfilepath(name, node)

229

230

oldumask = os.umask(0o002)

230

oldumask = os.umask(0o002)

231

try:

231

try:

232

# if this node already exists, save the old version for

232

# if this node already exists, save the old version for

233

# recovery/debugging purposes.

233

# recovery/debugging purposes.

234

if os.path.exists(filepath):

234

if os.path.exists(filepath):

235

newfilename = filepath + '_old'

235

newfilename = filepath + '_old'

236

# newfilename can be read-only and shutil.copy will fail.

236

# newfilename can be read-only and shutil.copy will fail.

237

# Delete newfilename to avoid it

237

# Delete newfilename to avoid it

238

if os.path.exists(newfilename):

238

if os.path.exists(newfilename):

239

shallowutil.unlinkfile(newfilename)

239

shallowutil.unlinkfile(newfilename)

240

shutil.copy(filepath, newfilename)

240

shutil.copy(filepath, newfilename)

241

242

shallowutil.mkstickygroupdir(self.ui, os.path.dirname(filepath))

242

shallowutil.mkstickygroupdir(self.ui, os.path.dirname(filepath))

243

shallowutil.writefile(filepath, data, readonly=True)

243

shallowutil.writefile(filepath, data, readonly=True)

244

245

if self._validatecache:

245

if self._validatecache:

246

if not self._validatekey(filepath, 'write'):

246

if not self._validatekey(filepath, 'write'):

247

raise error.Abort(_("local cache write was corrupted %s") %

247

raise error.Abort(_("local cache write was corrupted %s") %

248

filepath)

248

filepath)

249

finally:

249

finally:

250

os.umask(oldumask)

250

os.umask(oldumask)

251

252

def markrepo(self, path):

252

def markrepo(self, path):

253

"""Call this to add the given repo path to the store's list of

253

"""Call this to add the given repo path to the store's list of

254

repositories that are using it. This is useful later when doing garbage

254

repositories that are using it. This is useful later when doing garbage

255

collection, since it allows us to insecpt the repos to see what nodes

255

collection, since it allows us to insecpt the repos to see what nodes

256

they want to be kept alive in the store.

256

they want to be kept alive in the store.

257

"""

257

"""

258

repospath = os.path.join(self._path, "repos")

258

repospath = os.path.join(self._path, "repos")

259

with open(repospath, 'ab') as reposfile:

259

with open(repospath, 'ab') as reposfile:

260

reposfile.write(os.path.dirname(path) + "\n")

260

reposfile.write(os.path.dirname(path) + "\n")

261

262

repospathstat = os.stat(repospath)

262

repospathstat = os.stat(repospath)

263

if repospathstat.st_uid == self._uid:

263

if repospathstat.st_uid == self._uid:

264

os.chmod(repospath, 0o0664)

264

os.chmod(repospath, 0o0664)

265

266

def _validatekey(self, path, action):

266

def _validatekey(self, path, action):

267

with open(path, 'rb') as f:

267

with open(path, 'rb') as f:

268

data = f.read()

268

data = f.read()

269

270

if self._validatedata(data, path):

270

if self._validatedata(data, path):

271

return True

271

return True

272

273

if self._validatecachelog:

273

if self._validatecachelog:

274

with open(self._validatecachelog, 'ab+') as f:

274

with open(self._validatecachelog, 'ab+') as f:

275

f.write("corrupt %s during %s\n" % (path, action))

275

f.write("corrupt %s during %s\n" % (path, action))

276

277

os.rename(path, path + ".corrupt")

277

os.rename(path, path + ".corrupt")

278

return False

278

return False

279

280

def _validatedata(self, data, path):

280

def _validatedata(self, data, path):

281

try:

281

try:

282

if len(data) > 0:

282

if len(data) > 0:

283

# see remotefilelogserver.createfileblob for the format

283

# see remotefilelogserver.createfileblob for the format

284

offset, size, flags = shallowutil.parsesizeflags(data)

284

offset, size, flags = shallowutil.parsesizeflags(data)

285

if len(data) <= size:

285

if len(data) <= size:

286

# it is truncated

286

# it is truncated

287

return False

287

return False

288

289

# extract the node from the metadata

289

# extract the node from the metadata

290

offset += size

290

offset += size

291

datanode = data[offset:offset + 20]

291

datanode = data[offset:offset + 20]

292

293

# and compare against the path

293

# and compare against the path

294

if os.path.basename(path) == hex(datanode):

294

if os.path.basename(path) == hex(datanode):

295

# Content matches the intended path

295

# Content matches the intended path

296

return True

296

return True

297

return False

297

return False

298

except (ValueError, RuntimeError):

298

except (ValueError, RuntimeError):

299

pass

299

pass

300

301

return False

301

return False

302

303

def gc(self, keepkeys):

303

def gc(self, keepkeys):

304

ui = self.ui

304

ui = self.ui

305

cachepath = self._path

305

cachepath = self._path

306

307

# prune cache

307

# prune cache

308

import Queue

308

import Queue

309

queue = Queue.PriorityQueue()

309

queue = Queue.PriorityQueue()

310

originalsize = 0

310

originalsize = 0

311

size = 0

311

size = 0

312

count = 0

312

count = 0

313

removed = 0

313

removed = 0

314

315

# keep files newer than a day even if they aren't needed

315

# keep files newer than a day even if they aren't needed

316

limit = time.time() - (60 * 60 * 24)

316

limit = time.time() - (60 * 60 * 24)

317

318

progress = ui.makeprogress(_("removing unnecessary files"),

318

progress = ui.makeprogress(_("removing unnecessary files"),

319

unit="files")

319

unit="files")

320

progress.update(0)

320

progress.update(0)

321

for root, dirs, files in os.walk(cachepath):

321

for root, dirs, files in os.walk(cachepath):

322

for file in files:

322

for file in files:

323

if file == 'repos':

323

if file == 'repos':

324

continue

324

continue

325

326

# Don't delete pack files

326

# Don't delete pack files

327

if '/packs/' in root:

327

if '/packs/' in root:

328

continue

328

continue

329

330

progress.update(count)

330

progress.update(count)

331

path = os.path.join(root, file)

331

path = os.path.join(root, file)

332

key = os.path.relpath(path, cachepath)

332

key = os.path.relpath(path, cachepath)

333

count += 1

333

count += 1

334

try:

334

try:

335

pathstat = os.stat(path)

335

pathstat = os.stat(path)

336

except OSError as e:

336

except OSError as e:

337

# errno.ENOENT = no such file or directory

337

# errno.ENOENT = no such file or directory

338

if e.errno != errno.ENOENT:

338

if e.errno != errno.ENOENT:

339

raise

339

raise

340

msg = _("warning: file %s was removed by another process\n")

340

msg = _("warning: file %s was removed by another process\n")

341

ui.warn(msg % path)

341

ui.warn(msg % path)

342

continue

342

continue

343

344

originalsize += pathstat.st_size

344

originalsize += pathstat.st_size

345

346

if key in keepkeys or pathstat.st_atime > limit:

346

if key in keepkeys or pathstat.st_atime > limit:

347

queue.put((pathstat.st_atime, path, pathstat))

347

queue.put((pathstat.st_atime, path, pathstat))

348

size += pathstat.st_size

348

size += pathstat.st_size

349

else:

349

else:

350

try:

350

try:

351

shallowutil.unlinkfile(path)

351

shallowutil.unlinkfile(path)

352

except OSError as e:

352

except OSError as e:

353

# errno.ENOENT = no such file or directory

353

# errno.ENOENT = no such file or directory

354

if e.errno != errno.ENOENT:

354

if e.errno != errno.ENOENT:

355

raise

355

raise

356

msg = _("warning: file %s was removed by another "

356

msg = _("warning: file %s was removed by another "

357

"process\n")

357

"process\n")

358

ui.warn(msg % path)

358

ui.warn(msg % path)

359

continue

359

continue

360

removed += 1

360

removed += 1

361

progress.complete()

361

progress.complete()

362

363

# remove oldest files until under limit

363

# remove oldest files until under limit

364

limit = ui.configbytes("remotefilelog", "cachelimit")

364

limit = ui.configbytes("remotefilelog", "cachelimit")

365

if size > limit:

365

if size > limit:

366

excess = size - limit

366

excess = size - limit

367

progress = ui.makeprogress(_("enforcing cache limit"), unit="bytes",

367

progress = ui.makeprogress(_("enforcing cache limit"), unit="bytes",

368

total=excess)

368

total=excess)

369

removedexcess = 0

369

removedexcess = 0

370

while queue and size > limit and size > 0:

370

while queue and size > limit and size > 0:

371

progress.update(removedexcess)

371

progress.update(removedexcess)

372

atime, oldpath, oldpathstat = queue.get()

372

atime, oldpath, oldpathstat = queue.get()

373

try:

373

try:

374

shallowutil.unlinkfile(oldpath)

374

shallowutil.unlinkfile(oldpath)

375

except OSError as e:

375

except OSError as e:

376

# errno.ENOENT = no such file or directory

376

# errno.ENOENT = no such file or directory

377

if e.errno != errno.ENOENT:

377

if e.errno != errno.ENOENT:

378

raise

378

raise

379

msg = _("warning: file %s was removed by another process\n")

379

msg = _("warning: file %s was removed by another process\n")

380

ui.warn(msg % oldpath)

380

ui.warn(msg % oldpath)

381

size -= oldpathstat.st_size

381

size -= oldpathstat.st_size

382

removed += 1

382

removed += 1

383

removedexcess += oldpathstat.st_size

383

removedexcess += oldpathstat.st_size

384

progress.complete()

384

progress.complete()

385

386

ui.status(_("finished: removed %s of %s files (%0.2f GB to %0.2f GB)\n")

386

ui.status(_("finished: removed %s of %s files (%0.2f GB to %0.2f GB)\n")

387

% (removed, count,

387

% (removed, count,

388

float(originalsize) / 1024.0 / 1024.0 / 1024.0,

388

float(originalsize) / 1024.0 / 1024.0 / 1024.0,

389

float(size) / 1024.0 / 1024.0 / 1024.0))

389

float(size) / 1024.0 / 1024.0 / 1024.0))

390

391

class baseunionstore(object):

391

class baseunionstore(object):

392

def __init__(self, *args, **kwargs):

392

def __init__(self, *args, **kwargs):

393

# If one of the functions that iterates all of the stores is about to

393

# If one of the functions that iterates all of the stores is about to

394

# throw a KeyError, try this many times with a full refresh between

394

# throw a KeyError, try this many times with a full refresh between

395

# attempts. A repack operation may have moved data from one store to

395

# attempts. A repack operation may have moved data from one store to

396

# another while we were running.

396

# another while we were running.

397

self.numattempts = kwargs.get(r'numretries', 0) + 1

397

self.numattempts = kwargs.get(r'numretries', 0) + 1

398

# If not-None, call this function on every retry and if the attempts are

398

# If not-None, call this function on every retry and if the attempts are

399

# exhausted.

399

# exhausted.

400

self.retrylog = kwargs.get(r'retrylog', None)

400

self.retrylog = kwargs.get(r'retrylog', None)

401

402

def markforrefresh(self):

402

def markforrefresh(self):

403

for store in self.stores:

403

for store in self.stores:

404

if util.safehasattr(store, 'markforrefresh'):

404

if util.safehasattr(store, 'markforrefresh'):

405

store.markforrefresh()

405

store.markforrefresh()

406

407

@staticmethod

407

@staticmethod

408

def retriable(fn):

408

def retriable(fn):

409

def noop(*args):

409

def noop(*args):

410

pass

410

pass

411

def wrapped(self, *args, **kwargs):

411

def wrapped(self, *args, **kwargs):

412

retrylog = self.retrylog or noop

412

retrylog = self.retrylog or noop

413

funcname = fn.__name__

413

funcname = fn.__name__

414

for i in pycompat.xrange(self.numattempts):

414

for i in pycompat.xrange(self.numattempts):

415

if i > 0:

415

if i > 0:

416

retrylog('re-attempting (n=%d) %s\n' % (i, funcname))

416

retrylog('re-attempting (n=%d) %s\n' % (i, funcname))

417

self.markforrefresh()

417

self.markforrefresh()

418

try:

418

try:

419

return fn(self, *args, **kwargs)

419

return fn(self, *args, **kwargs)

420

except KeyError:

420

except KeyError:

421

pass

421

pass

422

# retries exhausted

422

# retries exhausted

423

retrylog('retries exhausted in %s, raising KeyError\n' % ~~funcname~~)

423

retrylog('retries exhausted in %s, raising KeyError\n' %

424

pycompat.sysbytes(funcname))

424

raise

425

raise

425

return wrapped

426

return wrapped

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             from __future__ import absolute_import
             import errno
             import hashlib
             import os
             import shutil
             import stat
             import time
             from mercurial.i18n import _
             from mercurial.node import bin, hex
             from mercurial import (
                 error,
                 pycompat,
                 util,
             )
             from . import (
                 constants,
                 shallowutil,
             )
             class basestore(object):
                 def __init__(self, repo, path, reponame, shared=False):
                     """Creates a remotefilelog store object for the given repo name.
                     `path` - The file path where this store keeps its data
                     `reponame` - The name of the repo. This is used to partition data from
                     many repos.
                     `shared` - True if this store is a shared cache of data from the central
                     server, for many repos on this machine. False means this store is for
                     the local data for one repo.
                     """
                     self.repo = repo
                     self.ui = repo.ui
                     self._path = path
                     self._reponame = reponame
                     self._shared = shared
                     self._uid = os.getuid() if not pycompat.iswindows else None
                     self._validatecachelog = self.ui.config("remotefilelog",
                                                             "validatecachelog")
                     self._validatecache = self.ui.config("remotefilelog", "validatecache",
                                                          'on')
                     if self._validatecache not in ('on', 'strict', 'off'):
                         self._validatecache = 'on'
                     if self._validatecache == 'off':
                         self._validatecache = False
                     if shared:
                         shallowutil.mkstickygroupdir(self.ui, path)
                 def getmissing(self, keys):
                     missing = []
                     for name, node in keys:
                         filepath = self._getfilepath(name, node)
                         exists = os.path.exists(filepath)
                         if (exists and self._validatecache == 'strict' and
                             not self._validatekey(filepath, 'contains')):
                             exists = False
                         if not exists:
                             missing.append((name, node))
                     return missing
                 # BELOW THIS ARE IMPLEMENTATIONS OF REPACK SOURCE
                 def markledger(self, ledger, options=None):
                     if options and options.get(constants.OPTION_PACKSONLY):
                         return
                     if self._shared:
                         for filename, nodes in self._getfiles():
                             for node in nodes:
                                 ledger.markdataentry(self, filename, node)
                                 ledger.markhistoryentry(self, filename, node)
                 def cleanup(self, ledger):
                     ui = self.ui
                     entries = ledger.sources.get(self, [])
                     count = 0
                     progress = ui.makeprogress(_("cleaning up"), unit="files",
                                                total=len(entries))
                     for entry in entries:
                         if entry.gced or (entry.datarepacked and entry.historyrepacked):
                             progress.update(count)
                             path = self._getfilepath(entry.filename, entry.node)
                             util.tryunlink(path)
                         count += 1
                     progress.complete()
                     # Clean up the repo cache directory.
                     self._cleanupdirectory(self._getrepocachepath())
                 # BELOW THIS ARE NON-STANDARD APIS
                 def _cleanupdirectory(self, rootdir):
                     """Removes the empty directories and unnecessary files within the root
                     directory recursively. Note that this method does not remove the root
                     directory itself. """
                     oldfiles = set()
                     otherfiles = set()
                     # osutil.listdir returns stat information which saves some rmdir/listdir
                     # syscalls.
                     for name, mode in util.osutil.listdir(rootdir):
                         if stat.S_ISDIR(mode):
                             dirpath = os.path.join(rootdir, name)
                             self._cleanupdirectory(dirpath)
                             # Now that the directory specified by dirpath is potentially
                             # empty, try and remove it.
                             try:
                                 os.rmdir(dirpath)
                             except OSError:
                                 pass
                         elif stat.S_ISREG(mode):
                             if name.endswith('_old'):
                                 oldfiles.add(name[:-4])
                             else:
                                 otherfiles.add(name)
                     # Remove the files which end with suffix '_old' and have no
                     # corresponding file without the suffix '_old'. See addremotefilelognode
                     # method for the generation/purpose of files with '_old' suffix.
                     for filename in oldfiles - otherfiles:
                         filepath = os.path.join(rootdir, filename + '_old')
                         util.tryunlink(filepath)
                 def _getfiles(self):
                     """Return a list of (filename, [node,...]) for all the revisions that
                     exist in the store.
                     This is useful for obtaining a list of all the contents of the store
                     when performing a repack to another store, since the store API requires
                     name+node keys and not namehash+node keys.
                     """
                     existing = {}
                     for filenamehash, node in self._listkeys():
                         existing.setdefault(filenamehash, []).append(node)
                     filenamemap = self._resolvefilenames(existing.keys())
                     for filename, sha in filenamemap.iteritems():
                         yield (filename, existing[sha])
                 def _resolvefilenames(self, hashes):
                     """Given a list of filename hashes that are present in the
                     remotefilelog store, return a mapping from filename->hash.
                     This is useful when converting remotefilelog blobs into other storage
                     formats.
                     """
                     if not hashes:
                         return {}
                     filenames = {}
                     missingfilename = set(hashes)
                     # Start with a full manifest, since it'll cover the majority of files
                     for filename in self.repo['tip'].manifest():
                         sha = hashlib.sha1(filename).digest()
                         if sha in missingfilename:
                             filenames[filename] = sha
                             missingfilename.discard(sha)
                     # Scan the changelog until we've found every file name
                     cl = self.repo.unfiltered().changelog
                     for rev in pycompat.xrange(len(cl) - 1, -1, -1):
                         if not missingfilename:
                             break
                         files = cl.readfiles(cl.node(rev))
                         for filename in files:
                             sha = hashlib.sha1(filename).digest()
                             if sha in missingfilename:
                                 filenames[filename] = sha
                                 missingfilename.discard(sha)
                     return filenames
                 def _getrepocachepath(self):
                     return os.path.join(
                         self._path, self._reponame) if self._shared else self._path
                 def _listkeys(self):
                     """List all the remotefilelog keys that exist in the store.
                     Returns a iterator of (filename hash, filecontent hash) tuples.
                     """
                     for root, dirs, files in os.walk(self._getrepocachepath()):
                         for filename in files:
                             if len(filename) != 40:
                                 continue
                             node = filename
                             if self._shared:
                                 # .../1a/85ffda..be21
                                 filenamehash = root[-41:-39] + root[-38:]
                             else:
                                 filenamehash = root[-40:]
                             yield (bin(filenamehash), bin(node))
                 def _getfilepath(self, name, node):
                     node = hex(node)
                     if self._shared:
                         key = shallowutil.getcachekey(self._reponame, name, node)
                     else:
                         key = shallowutil.getlocalkey(name, node)
                     return os.path.join(self._path, key)
                 def _getdata(self, name, node):
                     filepath = self._getfilepath(name, node)
                     try:
                         data = shallowutil.readfile(filepath)
                         if self._validatecache and not self._validatedata(data, filepath):
                             if self._validatecachelog:
                                 with open(self._validatecachelog, 'a+') as f:
                                     f.write("corrupt %s during read\n" % filepath)
                             os.rename(filepath, filepath + ".corrupt")
                             raise KeyError("corrupt local cache file %s" % filepath)
                     except IOError:
                         raise KeyError("no file found at %s for %s:%s" % (filepath, name,
                                                                           hex(node)))
                     return data
                 def addremotefilelognode(self, name, node, data):
                     filepath = self._getfilepath(name, node)
                     oldumask = os.umask(0o002)
                     try:
                         # if this node already exists, save the old version for
                         # recovery/debugging purposes.
                         if os.path.exists(filepath):
                             newfilename = filepath + '_old'
                             # newfilename can be read-only and shutil.copy will fail.
                             # Delete newfilename to avoid it
                             if os.path.exists(newfilename):
                                 shallowutil.unlinkfile(newfilename)
                             shutil.copy(filepath, newfilename)
                         shallowutil.mkstickygroupdir(self.ui, os.path.dirname(filepath))
                         shallowutil.writefile(filepath, data, readonly=True)
                         if self._validatecache:
                             if not self._validatekey(filepath, 'write'):
                                 raise error.Abort(_("local cache write was corrupted %s") %
                                                   filepath)
                     finally:
                         os.umask(oldumask)
                 def markrepo(self, path):
                     """Call this to add the given repo path to the store's list of
                     repositories that are using it. This is useful later when doing garbage
                     collection, since it allows us to insecpt the repos to see what nodes
                     they want to be kept alive in the store.
                     """
                     repospath = os.path.join(self._path, "repos")
                     with open(repospath, 'ab') as reposfile:
                         reposfile.write(os.path.dirname(path) + "\n")
                     repospathstat = os.stat(repospath)
                     if repospathstat.st_uid == self._uid:
                         os.chmod(repospath, 0o0664)
                 def _validatekey(self, path, action):
                     with open(path, 'rb') as f:
                         data = f.read()
                     if self._validatedata(data, path):
                         return True
                     if self._validatecachelog:
                         with open(self._validatecachelog, 'ab+') as f:
                             f.write("corrupt %s during %s\n" % (path, action))
                     os.rename(path, path + ".corrupt")
                     return False
                 def _validatedata(self, data, path):
                     try:
                         if len(data) > 0:
                             # see remotefilelogserver.createfileblob for the format
                             offset, size, flags = shallowutil.parsesizeflags(data)
                             if len(data) <= size:
                                 # it is truncated
                                 return False
                             # extract the node from the metadata
                             offset += size
                             datanode = data[offset:offset + 20]
                             # and compare against the path
                             if os.path.basename(path) == hex(datanode):
                                 # Content matches the intended path
                                 return True
                             return False
                     except (ValueError, RuntimeError):
                         pass
                     return False
                 def gc(self, keepkeys):
                     ui = self.ui
                     cachepath = self._path
                     # prune cache
                     import Queue
                     queue = Queue.PriorityQueue()
                     originalsize = 0
                     size = 0
                     count = 0
                     removed = 0
                     # keep files newer than a day even if they aren't needed
                     limit = time.time() - (60 * 60 * 24)
                     progress = ui.makeprogress(_("removing unnecessary files"),
                                                unit="files")
                     progress.update(0)
                     for root, dirs, files in os.walk(cachepath):
                         for file in files:
                             if file == 'repos':
                                 continue
                             # Don't delete pack files
                             if '/packs/' in root:
                                 continue
                             progress.update(count)
                             path = os.path.join(root, file)
                             key = os.path.relpath(path, cachepath)
                             count += 1
                             try:
                                 pathstat = os.stat(path)
                             except OSError as e:
                                 # errno.ENOENT = no such file or directory
                                 if e.errno != errno.ENOENT:
                                     raise
                                 msg = _("warning: file %s was removed by another process\n")
                                 ui.warn(msg % path)
                                 continue
                             originalsize += pathstat.st_size
                             if key in keepkeys or pathstat.st_atime > limit:
                                 queue.put((pathstat.st_atime, path, pathstat))
                                 size += pathstat.st_size
                             else:
                                 try:
                                     shallowutil.unlinkfile(path)
                                 except OSError as e:
                                     # errno.ENOENT = no such file or directory
                                     if e.errno != errno.ENOENT:
                                         raise
                                     msg = _("warning: file %s was removed by another "
                                             "process\n")
                                     ui.warn(msg % path)
                                     continue
                                 removed += 1
                     progress.complete()
                     # remove oldest files until under limit
                     limit = ui.configbytes("remotefilelog", "cachelimit")
                     if size > limit:
                         excess = size - limit
                         progress = ui.makeprogress(_("enforcing cache limit"), unit="bytes",
                                                    total=excess)
                         removedexcess = 0
                         while queue and size > limit and size > 0:
                             progress.update(removedexcess)
                             atime, oldpath, oldpathstat = queue.get()
                             try:
                                 shallowutil.unlinkfile(oldpath)
                             except OSError as e:
                                 # errno.ENOENT = no such file or directory
                                 if e.errno != errno.ENOENT:
                                     raise
                                 msg = _("warning: file %s was removed by another process\n")
                                 ui.warn(msg % oldpath)
                             size -= oldpathstat.st_size
                             removed += 1
                             removedexcess += oldpathstat.st_size
                         progress.complete()
                     ui.status(_("finished: removed %s of %s files (%0.2f GB to %0.2f GB)\n")
                               % (removed, count,
                                  float(originalsize) / 1024.0 / 1024.0 / 1024.0,
                                  float(size) / 1024.0 / 1024.0 / 1024.0))
             class baseunionstore(object):
                 def __init__(self, *args, **kwargs):
                     # If one of the functions that iterates all of the stores is about to
                     # throw a KeyError, try this many times with a full refresh between
                     # attempts. A repack operation may have moved data from one store to
                     # another while we were running.
                     self.numattempts = kwargs.get(r'numretries', 0) + 1
                     # If not-None, call this function on every retry and if the attempts are
                     # exhausted.
                     self.retrylog = kwargs.get(r'retrylog', None)
                 def markforrefresh(self):
                     for store in self.stores:
                         if util.safehasattr(store, 'markforrefresh'):
                             store.markforrefresh()
                 @staticmethod
                 def retriable(fn):
                     def noop(*args):
                         pass
                     def wrapped(self, *args, **kwargs):
                         retrylog = self.retrylog or noop
                         funcname = fn.__name__
                         for i in pycompat.xrange(self.numattempts):
                             if i > 0:
                                 retrylog('re-attempting (n=%d) %s\n' % (i, funcname))
                                 self.markforrefresh()
                             try:
                                 return fn(self, *args, **kwargs)
                             except KeyError:
                                 pass
                         # retries exhausted
-                        retrylog('retries exhausted in %s, raising KeyError\n' % funcname)
+                        retrylog('retries exhausted in %s, raising KeyError\n' %
+                                 pycompat.sysbytes(funcname))
                         raise
                     return wrapped