upstream/mercurial-mirror Commit - r31445:83e08014

1

# __init__.py - Startup and module loading logic for Mercurial.

1

# __init__.py - Startup and module loading logic for Mercurial.

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import imp

10

import imp

11

import os

11

import os

12

import sys

12

import sys

13

import zipimport

13

import zipimport

14

15

from . import (

15

from . import (

16

policy

16

policy

17

)

17

)

18

19

# Nothing is exported through ``from mercurial import *``.
__all__ = []

# Module loading policy, read once from the ``policy`` module. The import
# hooks in this file compare it against ``policy.policynoc`` and ``b'c'`` to
# decide between the C and the pure Python implementations.
modulepolicy = policy.policy

22

23

# Modules that have both Python and C implementations. See also the
# set of .py files under mercurial/pure/.
_dualmodules = set([
    'mercurial.base85',
    'mercurial.bdiff',
    'mercurial.diffhelpers',
    'mercurial.mpatch',
    'mercurial.osutil',
    'mercurial.parsers',
])

33

34

class hgimporter(object):
    """Object that conforms to import hook interface defined in PEP-302."""

    def find_module(self, name, path=None):
        """Return ``self`` for modules listed in ``_dualmodules``.

        Any other module yields ``None`` so that the remaining importers
        get a chance to handle it.
        """
        # We only care about modules that have both C and pure implementations.
        if name in _dualmodules:
            return self
        return None

    def load_module(self, name):
        """Load ``name`` from either the C or the pure implementation.

        A module already present in ``sys.modules`` is returned as-is.
        Otherwise the C version is tried first unless ``modulepolicy`` is
        listed in ``policy.policynoc``; on ``ImportError`` the version under
        ``mercurial/pure`` is loaded, except when the policy is ``b'c'``, in
        which case the ``ImportError`` propagates.

        The loaded module is stored in ``sys.modules`` and returned.
        """
        mod = sys.modules.get(name, None)
        if mod:
            return mod

        mercurial = sys.modules['mercurial']

        # The zip importer behaves sufficiently differently from the default
        # importer to warrant its own code path.
        loader = getattr(mercurial, '__loader__', None)
        if isinstance(loader, zipimport.zipimporter):
            def ziploader(*paths):
                """Obtain a zipimporter for a directory under the main zip."""
                path = os.path.join(loader.archive, *paths)
                zl = sys.path_importer_cache.get(path)
                if not zl:
                    zl = zipimport.zipimporter(path)
                return zl

            try:
                if modulepolicy in policy.policynoc:
                    raise ImportError()

                zl = ziploader('mercurial')
                mod = zl.load_module(name)
                # Unlike imp, ziploader doesn't expose module metadata that
                # indicates the type of module. So just assume what we found
                # is OK (even though it could be a pure Python module).
            except ImportError:
                if modulepolicy == b'c':
                    raise
                zl = ziploader('mercurial', 'pure')
                mod = zl.load_module(name)

            sys.modules[name] = mod
            return mod

        # Unlike the default importer which searches special locations and
        # sys.path, we only look in the directory where "mercurial" was
        # imported from.

        # imp.find_module doesn't support submodules (modules with ".").
        # Instead you have to pass the parent package's __path__ attribute
        # as the path argument.
        stem = name.split('.')[-1]

        # imp.find_module() returns an open file object as the first item of
        # its result and the caller is responsible for closing it, so keep
        # track of the tuple and close the handle on every exit path.
        modinfo = None
        try:
            try:
                if modulepolicy in policy.policynoc:
                    raise ImportError()

                modinfo = imp.find_module(stem, mercurial.__path__)

                # The Mercurial installer used to copy files from
                # mercurial/pure/*.py to mercurial/*.py. Therefore, it's
                # possible for some installations to have .py files under
                # mercurial/*. Loading Python modules when we expected C
                # versions could result in a) poor performance b) loading a
                # version from a previous Mercurial version, potentially
                # leading to incompatibility. Either scenario is bad. So we
                # verify that modules loaded from mercurial/* are C
                # extensions. If the current policy allows the loading of
                # .py modules, the module will be re-imported from
                # mercurial/pure/* below.
                if modinfo[2][2] != imp.C_EXTENSION:
                    raise ImportError('.py version of %s found where C '
                                      'version should exist' % name)

            except ImportError:
                if modulepolicy == b'c':
                    raise

                # Release the handle of a rejected candidate before
                # searching the pure directory.
                if modinfo is not None and modinfo[0] is not None:
                    modinfo[0].close()
                modinfo = None

                # Could not load the C extension and pure Python is allowed.
                # So try to load them.
                from . import pure
                modinfo = imp.find_module(stem, pure.__path__)
                if not modinfo:
                    raise ImportError('could not find mercurial module %s' %
                                      name)

            mod = imp.load_module(name, *modinfo)
        finally:
            if modinfo is not None and modinfo[0] is not None:
                modinfo[0].close()

        sys.modules[name] = mod
        return mod

123

124

# Python 3 uses a custom module loader that transforms source code between

124

# Python 3 uses a custom module loader that transforms source code between

125

# source file reading and compilation. This is done by registering a custom

125

# source file reading and compilation. This is done by registering a custom

126

# finder that changes the spec for Mercurial modules to use a custom loader.

126

# finder that changes the spec for Mercurial modules to use a custom loader.

127

if sys.version_info[0] >= 3:

127

if sys.version_info[0] >= 3:

128

from . import pure

128

from . import pure

129

import importlib

129

import importlib

130

import io

130

import io

131

import token

131

import token

132

import tokenize

132

import tokenize

133

134

class hgpathentryfinder(importlib.abc.MetaPathFinder):
    """A sys.meta_path finder that uses a custom module loader."""

    def find_spec(self, fullname, path, target=None):
        """Return a module spec whose loader is ``hgloader``, or ``None``.

        Only names starting with ``mercurial.``, ``hgext.`` or ``hgext3rd.``
        are considered, and ``mercurial.zstd*`` is excluded. Names listed in
        ``_dualmodules`` are looked up under ``mercurial/pure`` and the
        resulting spec is renamed back to the requested name.

        The actual lookup is delegated to the other finders registered on
        ``sys.meta_path``; ``None`` is returned when none of them finds the
        module.
        """
        # Only handle Mercurial-related modules.
        if not fullname.startswith(('mercurial.', 'hgext.', 'hgext3rd.')):
            return None
        # zstd is already dual-version clean, don't try and mangle it
        if fullname.startswith('mercurial.zstd'):
            return None

        # This assumes Python 3 doesn't support loading C modules.
        if fullname in _dualmodules:
            stem = fullname.split('.')[-1]
            fullname = 'mercurial.pure.%s' % stem
            target = pure
            assert len(path) == 1
            path = [os.path.join(path[0], 'pure')]

        # Try to find the module using other registered finders.
        spec = None
        for finder in sys.meta_path:
            # Skip ourselves to avoid infinite recursion.
            if finder is self:
                continue

            # Legacy finders only implement find_module(); they cannot
            # produce a spec, so skip them instead of failing the import
            # with an AttributeError.
            findspec = getattr(finder, 'find_spec', None)
            if findspec is None:
                continue

            spec = findspec(fullname, path, target=target)
            if spec:
                break

        # This is a Mercurial-related module but we couldn't find it
        # using the previously-registered finders. This likely means
        # the module doesn't exist.
        if not spec:
            return None

        # Undo the redirection to mercurial.pure so the module is registered
        # under the name that was requested.
        if fullname.startswith('mercurial.pure.'):
            spec.name = spec.name.replace('.pure.', '.')

        # TODO need to support loaders from alternate specs, like zip
        # loaders.
        spec.loader = hgloader(spec.name, spec.origin)
        return spec

175

176

def replacetokens(tokens, fullname):
    """Transform a stream of tokens from raw to Python 3.

    It is called by the custom module loading machinery to rewrite
    source/tokens between source decoding and compilation.

    ``tokens`` is the list of tokens of the module source and ``fullname``
    is the dotted name of the module being loaded.

    Returns a generator of possibly rewritten tokens.

    The input token list may be mutated as part of processing. However,
    its changes do not necessarily match the output token stream.

    REMEMBER TO CHANGE ``BYTECODEHEADER`` WHEN CHANGING THIS FUNCTION
    OR CACHED FILES WON'T GET INVALIDATED PROPERLY.
    """
    futureimpline = False

    # The following utility functions access the tokens list and i index of
    # the ``for i, t in enumerate(tokens)`` loop below.
    def _isop(j, *o):
        """Assert that tokens[j] is an OP with one of the given values"""
        try:
            return tokens[j].type == token.OP and tokens[j].string in o
        except IndexError:
            return False

    def _findargnofcall(n):
        """Find arg n of a call expression (start at 0)

        Returns index of the first token of that argument, or None if
        there is not that many arguments.

        Assumes that token[i + 1] is '('.

        """
        nested = 0
        for j in range(i + 2, len(tokens)):
            if _isop(j, ')', ']', '}'):
                # end of call, tuple, subscription or dict / set
                nested -= 1
                if nested < 0:
                    return None
            elif n == 0:
                # this is the starting position of arg
                return j
            elif _isop(j, '(', '[', '{'):
                nested += 1
            elif _isop(j, ',') and nested == 0:
                n -= 1

        return None

    def _ensureunicode(j):
        """Make sure the token at j is a unicode string

        This rewrites a string token to include the unicode literal prefix
        so the string transformer won't add the byte prefix.

        Ignores tokens that are not strings. Assumes bounds checking has
        already been done.

        """
        st = tokens[j]
        if st.type == token.STRING and st.string.startswith(("'", '"')):
            tokens[j] = st._replace(string='u%s' % st.string)

    for i, t in enumerate(tokens):
        # Convert most string literals to byte literals. String literals
        # in Python 2 are bytes. String literals in Python 3 are unicode.
        # Most strings in Mercurial are bytes and unicode strings are rare.
        # Rather than rewrite all string literals to use ``b''`` to indicate
        # byte strings, we apply this token transformer to insert the ``b``
        # prefix nearly everywhere.
        if t.type == token.STRING:
            s = t.string

            # Preserve docstrings as string literals. This is inconsistent
            # with regular unprefixed strings. However, the
            # "from __future__" parsing (which allows a module docstring to
            # exist before it) doesn't properly handle the docstring if it
            # is b''' prefixed, leading to a SyntaxError. We leave all
            # docstrings as unprefixed to avoid this. This means Mercurial
            # components touching docstrings need to handle unicode,
            # unfortunately.
            if s[0:3] in ("'''", '"""'):
                yield t
                continue

            # If the first character isn't a quote, it is likely a string
            # prefixing character (such as 'b', 'u', or 'r'). Ignore.
            if s[0] not in ("'", '"'):
                yield t
                continue

            # String literal. Prefix to make a b'' string.
            yield t._replace(string='b%s' % t.string)
            continue

        # Insert compatibility imports at "from __future__ import" line.
        # No '\n' should be added to preserve line numbers.
        if (t.type == token.NAME and t.string == 'import' and
            all(u.type == token.NAME for u in tokens[i - 2:i]) and
            [u.string for u in tokens[i - 2:i]] == ['from', '__future__']):
            futureimpline = True
        if t.type == token.NEWLINE and futureimpline:
            futureimpline = False
            # pycompat is the module that provides these names, so it must
            # not import from itself.
            if fullname == 'mercurial.pycompat':
                yield t
                continue
            r, c = t.start
            l = (b'; from mercurial.pycompat import '
                 b'delattr, getattr, hasattr, setattr, xrange, open\n')
            # The NEWLINE token produced for ``l`` takes the place of ``t``;
            # every emitted token is shifted onto row ``r`` after column
            # ``c`` so the extra import stays on the same source line.
            for u in tokenize.tokenize(io.BytesIO(l).readline):
                if u.type in (tokenize.ENCODING, token.ENDMARKER):
                    continue
                yield u._replace(
                    start=(r, c + u.start[1]), end=(r, c + u.end[1]))
            continue

        # This looks like a function call.
        if t.type == token.NAME and _isop(i + 1, '('):
            fn = t.string

            # *attr() builtins don't accept byte strings to 2nd argument.
            if (fn in ('getattr', 'setattr', 'hasattr', 'safehasattr') and
                    not _isop(i - 1, '.')):
                arg1idx = _findargnofcall(1)
                if arg1idx is not None:
                    _ensureunicode(arg1idx)

            # .encode() and .decode() on str/bytes/unicode don't accept
            # byte strings on Python 3.
            elif fn in ('encode', 'decode') and _isop(i - 1, '.'):
                for argn in range(2):
                    argidx = _findargnofcall(argn)
                    if argidx is not None:
                        _ensureunicode(argidx)

            # It changes iteritems/values to items/values as they are not
            # present in Python 3 world.
            elif fn in ('iteritems', 'itervalues'):
                # Dropping the leading "iter" gives "items" / "values".
                yield t._replace(string=fn[4:])
                continue

        # Emit unmodified token.
        yield t

321

322

# Header to add to bytecode files. This MUST be changed when
# ``replacetokens`` or any mechanism that changes semantics of module
# loading is changed. Otherwise cached bytecode may get loaded without
# the new transformation mechanisms applied.
BYTECODEHEADER = b'HG\x00\x09'

327

328

class hgloader(importlib.machinery.SourceFileLoader):
    """Custom module loader that transforms source code.

    When the source code is converted to a code object, we transform
    certain patterns to be Python 3 compatible. This allows us to write code
    that is natively Python 2 and compatible with Python 3 without
    making the code excessively ugly.

    We do this by transforming the token stream between parse and compile.

    Implementing transformations invalidates caching assumptions made
    by the built-in importer. The built-in importer stores a header on
    saved bytecode files indicating the Python/bytecode version. If the
    version changes, the cached bytecode is ignored. The Mercurial
    transformations could change at any time. This means we need to check
    that cached bytecode was generated with the current transformation
    code or there could be a mismatch between cached bytecode and what
    would be generated from this class.

    We supplement the bytecode caching layer by wrapping ``get_data``
    and ``set_data``. These functions are called when the
    ``SourceFileLoader`` retrieves and saves bytecode cache files,
    respectively. We simply add an additional header on the file. As
    long as the version in this file is changed when semantics change,
    cached bytecode should be invalidated when transformations change.

    The added header has the form ``HG<VERSION>``. That is a literal
    ``HG`` with 2 binary bytes indicating the transformation version.
    """

    def get_data(self, path):
        """Read ``path``; for bytecode files, check and strip the HG header.

        Raises ``OSError`` when a bytecode file lacks the header or carries
        a header other than ``BYTECODEHEADER``.
        """
        data = super(hgloader, self).get_data(path)

        if not path.endswith(tuple(importlib.machinery.BYTECODE_SUFFIXES)):
            return data

        # There should be a header indicating the Mercurial transformation
        # version. If it doesn't exist or doesn't match the current version,
        # we raise an OSError because that is what
        # ``SourceFileLoader.get_code()`` expects when loading bytecode
        # paths to indicate the cached file is "bad."
        if data[0:2] != b'HG':
            raise OSError('no hg header')
        if data[0:4] != BYTECODEHEADER:
            raise OSError('hg header version mismatch')

        return data[4:]

    def set_data(self, path, data, *args, **kwargs):
        """Write ``data`` to ``path``, prefixing bytecode files with the
        ``BYTECODEHEADER``."""
        if path.endswith(tuple(importlib.machinery.BYTECODE_SUFFIXES)):
            data = BYTECODEHEADER + data

        return super(hgloader, self).set_data(path, data, *args, **kwargs)

    def source_to_code(self, data, path):
        """Perform token transformation before compilation."""
        buf = io.BytesIO(data)
        tokens = tokenize.tokenize(buf.readline)
        data = tokenize.untokenize(replacetokens(list(tokens), self.name))
        # Python's built-in importer strips frames from exceptions raised
        # for this code. Unfortunately, that mechanism isn't extensible
        # and our frame will be blamed for the import failure. There
        # are extremely hacky ways to do frame stripping. We haven't
        # implemented them because they are very ugly.
        return super(hgloader, self).source_to_code(data, path)

392

393

# We automagically register our custom importer as a side-effect of loading.

393

# We automagically register our custom importer as a side-effect of loading.

394

# This is necessary to ensure that any entry points are able to import

394

# This is necessary to ensure that any entry points are able to import

395

# mercurial.* modules without having to perform this registration themselves.

395

# mercurial.* modules without having to perform this registration themselves.

396

if sys.version_info[0] >= 3:

396

if sys.version_info[0] >= 3:

397

_importercls = hgpathentryfinder

397

_importercls = hgpathentryfinder

398

else:

398

else:

399

_importercls = hgimporter

399

_importercls = hgimporter

400

if not any(isinstance(x, _importercls) for x in sys.meta_path):

400

if not any(isinstance(x, _importercls) for x in sys.meta_path):

401

# meta_path is used before any implicit finders and before sys.path.

401

# meta_path is used before any implicit finders and before sys.path.

402

sys.meta_path.insert(0, _importercls())

402

sys.meta_path.insert(0, _importercls())

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # __init__.py - Startup and module loading logic for Mercurial.
             #
             # Copyright 2015 Gregory Szorc <gregory.szorc@gmail.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import imp
             import os
             import sys
             import zipimport
             from . import (
                 policy
             )
             # Nothing is exported by ``from mercurial import *``.
             __all__ = []
             # Module loading policy taken from the ``policy`` module. The importer
             # below compares it against ``policy.policynoc`` (skip the C lookup)
             # and ``b'c'`` (do not fall back to the pure Python version).
             modulepolicy = policy.policy
             # Modules that have both Python and C implementations. See also the
             # set of .py files under mercurial/pure/.
             # Names are fully qualified because the import hooks test the full
             # dotted module name for membership in this set.
             _dualmodules = set([
                 'mercurial.base85',
                 'mercurial.bdiff',
                 'mercurial.diffhelpers',
                 'mercurial.mpatch',
                 'mercurial.osutil',
                 'mercurial.parsers',
             ])
             class hgimporter(object):
                 """Object that conforms to import hook interface defined in PEP-302.

                 It only handles the modules listed in ``_dualmodules`` and picks
                 between their C and pure Python implementations according to
                 ``modulepolicy``.
                 """

                 def find_module(self, name, path=None):
                     """Return this importer for dual modules, None otherwise.

                     ``path`` is accepted for PEP-302 compatibility and is unused.
                     """
                     # We only care about modules that have both C and pure
                     # implementations.
                     if name in _dualmodules:
                         return self
                     return None

                 def load_module(self, name):
                     """Load and return the implementation of dual module ``name``.

                     An already imported module is returned from ``sys.modules``.
                     Otherwise the C version is looked up next to the ``mercurial``
                     package unless the policy is in ``policy.policynoc``; if that
                     fails and the policy is not ``b'c'``, the version under
                     ``mercurial/pure`` is loaded instead.

                     Raises ImportError when no acceptable implementation exists.
                     """
                     mod = sys.modules.get(name, None)
                     if mod:
                         return mod

                     mercurial = sys.modules['mercurial']

                     # The zip importer behaves sufficiently differently from the
                     # default importer to warrant its own code path.
                     loader = getattr(mercurial, '__loader__', None)
                     if isinstance(loader, zipimport.zipimporter):
                         def ziploader(*paths):
                             """Obtain a zipimporter for a directory under the main
                             zip."""
                             path = os.path.join(loader.archive, *paths)
                             zl = sys.path_importer_cache.get(path)
                             if not zl:
                                 zl = zipimport.zipimporter(path)
                             return zl

                         try:
                             if modulepolicy in policy.policynoc:
                                 raise ImportError()

                             zl = ziploader('mercurial')
                             mod = zl.load_module(name)
                             # Unlike imp, ziploader doesn't expose module metadata
                             # that indicates the type of module. So just assume
                             # what we found is OK (even though it could be a pure
                             # Python module).
                         except ImportError:
                             if modulepolicy == b'c':
                                 raise
                             zl = ziploader('mercurial', 'pure')
                             mod = zl.load_module(name)

                         sys.modules[name] = mod
                         return mod

                     # Unlike the default importer which searches special locations
                     # and sys.path, we only look in the directory where "mercurial"
                     # was imported from.

                     # imp.find_module doesn't support submodules (modules with ".").
                     # Instead you have to pass the parent package's __path__
                     # attribute as the path argument.
                     stem = name.split('.')[-1]

                     try:
                         if modulepolicy in policy.policynoc:
                             raise ImportError()

                         modinfo = imp.find_module(stem, mercurial.__path__)

                         # The Mercurial installer used to copy files from
                         # mercurial/pure/*.py to mercurial/*.py. Therefore, it's
                         # possible for some installations to have .py files under
                         # mercurial/*. Loading Python modules when we expected C
                         # versions could result in a) poor performance b) loading
                         # a version from a previous Mercurial version, potentially
                         # leading to incompatibility. Either scenario is bad. So we
                         # verify that modules loaded from mercurial/* are C
                         # extensions. If the current policy allows the loading of
                         # .py modules, the module will be re-imported from
                         # mercurial/pure/* below.
                         if modinfo[2][2] != imp.C_EXTENSION:
                             # imp.find_module() hands back an open file; we are
                             # rejecting this candidate, so release it here.
                             if modinfo[0] is not None:
                                 modinfo[0].close()
                             raise ImportError('.py version of %s found where C '
                                               'version should exist' % name)

                     except ImportError:
                         if modulepolicy == b'c':
                             raise

                         # Could not load the C extension and pure Python is
                         # allowed. So try to load them.
                         from . import pure
                         modinfo = imp.find_module(stem, pure.__path__)
                         if not modinfo:
                             raise ImportError('could not find mercurial module %s' %
                                               name)

                     try:
                         mod = imp.load_module(name, *modinfo)
                     finally:
                         # The caller of imp.load_module() is responsible for
                         # closing the file returned by imp.find_module(), even
                         # when loading fails.
                         if modinfo[0] is not None:
                             modinfo[0].close()

                     sys.modules[name] = mod
                     return mod
             # Python 3 uses a custom module loader that transforms source code between
             # source file reading and compilation. This is done by registering a custom
             # finder that changes the spec for Mercurial modules to use a custom loader.
             if sys.version_info[0] >= 3:
                 from . import pure
                 import importlib
                 import io
                 import token
                 import tokenize
                 class hgpathentryfinder(importlib.abc.MetaPathFinder):
                     """A sys.meta_path finder that uses a custom module loader.

                     The actual lookup is delegated to the other finders registered
                     on ``sys.meta_path``; the spec they return is then rewritten to
                     be loaded through ``hgloader``.
                     """

                     def find_spec(self, fullname, path, target=None):
                         """Return a spec using ``hgloader`` for Mercurial modules.

                         Returns None for modules outside ``mercurial.``, ``hgext.``
                         and ``hgext3rd.``, for ``mercurial.zstd*``, and when no
                         other finder can locate the module.
                         """
                         # Only handle Mercurial-related modules.
                         if not fullname.startswith(('mercurial.', 'hgext.',
                                                     'hgext3rd.')):
                             return None

                         # zstd is already dual-version clean, don't try and mangle
                         # it
                         if fullname.startswith('mercurial.zstd'):
                             return None

                         # This assumes Python 3 doesn't support loading C modules.
                         if fullname in _dualmodules:
                             stem = fullname.split('.')[-1]
                             fullname = 'mercurial.pure.%s' % stem
                             target = pure
                             assert len(path) == 1
                             path = [os.path.join(path[0], 'pure')]

                         # Try to find the module using other registered finders.
                         spec = None
                         for finder in sys.meta_path:
                             # Skip ourselves (by identity) to avoid recursing.
                             if finder is self:
                                 continue

                             # Legacy finders may only implement find_module();
                             # they cannot produce a spec, so skip them instead of
                             # failing with AttributeError.
                             findspec = getattr(finder, 'find_spec', None)
                             if findspec is None:
                                 continue

                             spec = findspec(fullname, path, target=target)
                             if spec:
                                 break

                         # This is a Mercurial-related module but we couldn't find
                         # it using the previously-registered finders. This likely
                         # means the module doesn't exist.
                         if not spec:
                             return None

                         # Dual modules were looked up under mercurial.pure but
                         # must be exposed under their original name.
                         if fullname.startswith('mercurial.pure.'):
                             spec.name = spec.name.replace('.pure.', '.')

                         # TODO need to support loaders from alternate specs, like
                         # zip loaders.
                         spec.loader = hgloader(spec.name, spec.origin)
                         return spec
                 def replacetokens(tokens, fullname):
                     """Transform a stream of tokens from raw to Python 3.

                     It is called by the custom module loading machinery to rewrite
                     source/tokens between source decoding and compilation.

                     ``tokens`` is a list of tokenize tokens and ``fullname`` is the
                     dotted name of the module being loaded (``mercurial.pycompat``
                     is exempt from the compatibility import injection).

                     Returns a generator of possibly rewritten tokens.

                     The input token list may be mutated as part of processing.
                     However, its changes do not necessarily match the output token
                     stream.

                     REMEMBER TO CHANGE ``BYTECODEHEADER`` WHEN CHANGING THIS
                     FUNCTION OR CACHED FILES WON'T GET INVALIDATED PROPERLY.
                     """
                     futureimpline = False

                     # The following utility functions access the tokens list and i
                     # index of the for i, t enumerate(tokens) loop below
                     def _isop(j, *o):
                         """Assert that tokens[j] is an OP with one of the given
                         values"""
                         try:
                             return tokens[j].type == token.OP and tokens[j].string in o
                         except IndexError:
                             return False

                     def _findargnofcall(n):
                         """Find arg n of a call expression (start at 0)

                         Returns index of the first token of that argument, or None
                         if there is not that many arguments.

                         Assumes that token[i + 1] is '('.
                         """
                         nested = 0
                         for j in range(i + 2, len(tokens)):
                             if _isop(j, ')', ']', '}'):
                                 # end of call, tuple, subscription or dict / set
                                 nested -= 1
                                 if nested < 0:
                                     return None
                             elif n == 0:
                                 # this is the starting position of arg
                                 return j
                             elif _isop(j, '(', '[', '{'):
                                 nested += 1
                             elif _isop(j, ',') and nested == 0:
                                 n -= 1

                         return None

                     def _ensureunicode(j):
                         """Make sure the token at j is a unicode string

                         This rewrites a string token to include the unicode literal
                         prefix so the string transformer won't add the byte prefix.

                         Ignores tokens that are not strings. Assumes bounds checking
                         has already been done.
                         """
                         st = tokens[j]
                         if st.type == token.STRING and st.string.startswith(("'", '"')):
                             tokens[j] = st._replace(string='u%s' % st.string)

                     for i, t in enumerate(tokens):
                         # Convert most string literals to byte literals. String
                         # literals in Python 2 are bytes. String literals in Python 3
                         # are unicode. Most strings in Mercurial are bytes and
                         # unicode strings are rare. Rather than rewrite all string
                         # literals to use ``b''`` to indicate byte strings, we apply
                         # this token transformer to insert the ``b`` prefix nearly
                         # everywhere.
                         if t.type == token.STRING:
                             s = t.string

                             # Preserve docstrings as string literals. This is
                             # inconsistent with regular unprefixed strings. However,
                             # the "from __future__" parsing (which allows a module
                             # docstring to exist before it) doesn't properly handle
                             # the docstring if it is b''' prefixed, leading to a
                             # SyntaxError. We leave all docstrings as unprefixed to
                             # avoid this. This means Mercurial components touching
                             # docstrings need to handle unicode, unfortunately.
                             if s[0:3] in ("'''", '"""'):
                                 yield t
                                 continue

                             # If the first character isn't a quote, it is likely a
                             # string prefixing character (such as 'b', 'u', or 'r').
                             # Ignore.
                             if s[0] not in ("'", '"'):
                                 yield t
                                 continue

                             # String literal. Prefix to make a b'' string.
                             yield t._replace(string='b%s' % t.string)
                             continue

                         # Insert compatibility imports at "from __future__ import"
                         # line. No '\n' should be added to preserve line numbers.
                         if (t.type == token.NAME and t.string == 'import' and
                             all(u.type == token.NAME for u in tokens[i - 2:i]) and
                             [u.string for u in tokens[i - 2:i]] == ['from', '__future__']):
                             futureimpline = True
                         if t.type == token.NEWLINE and futureimpline:
                             futureimpline = False
                             if fullname == 'mercurial.pycompat':
                                 yield t
                                 continue
                             r, c = t.start
                             l = (b'; from mercurial.pycompat import '
                                  b'delattr, getattr, hasattr, setattr, xrange, open\n')
                             # The injected tokens are shifted onto the position of
                             # the NEWLINE they replace; the snippet ends with its
                             # own newline.
                             for u in tokenize.tokenize(io.BytesIO(l).readline):
                                 if u.type in (tokenize.ENCODING, token.ENDMARKER):
                                     continue
                                 yield u._replace(
                                     start=(r, c + u.start[1]), end=(r, c + u.end[1]))
                             continue

                         # This looks like a function call.
                         if t.type == token.NAME and _isop(i + 1, '('):
                             fn = t.string

                             # *attr() builtins don't accept byte strings to 2nd
                             # argument.
                             if (fn in ('getattr', 'setattr', 'hasattr', 'safehasattr') and
                                     not _isop(i - 1, '.')):
                                 arg1idx = _findargnofcall(1)
                                 if arg1idx is not None:
                                     _ensureunicode(arg1idx)

                             # .encode() and .decode() on str/bytes/unicode don't
                             # accept byte strings on Python 3.
                             elif fn in ('encode', 'decode') and _isop(i - 1, '.'):
                                 for argn in range(2):
                                     argidx = _findargnofcall(argn)
                                     if argidx is not None:
                                         _ensureunicode(argidx)

                             # It changes iteritems/itervalues to items/values as
                             # they are not present in Python 3 world. Dropping the
                             # 4-character ``iter`` prefix yields the new name.
                             elif fn in ('iteritems', 'itervalues'):
                                 yield t._replace(string=fn[4:])
                                 continue

                         # Emit unmodified token.
                         yield t

                 # Header to add to bytecode files. This MUST be changed when
                 # ``replacetokens`` or any mechanism that changes semantics of module
                 # loading is changed. Otherwise cached bytecode may get loaded without
                 # the new transformation mechanisms applied.
                 BYTECODEHEADER = b'HG\x00\x09'
                 class hgloader(importlib.machinery.SourceFileLoader):
                     """Source file loader that rewrites tokens before compiling.

                     Source read from disk is tokenized, passed through
                     ``replacetokens`` and only then compiled, which lets the code
                     base stay natively Python 2 while still running on Python 3.

                     Because the rewrite affects the resulting bytecode, the cache
                     validation done by the built-in importer (which only knows
                     about the Python/bytecode version) is not sufficient: stale
                     cache files produced by an older set of transformations must
                     be rejected as well.

                     To achieve that, ``get_data`` and ``set_data`` are wrapped.
                     Bytecode cache files are written with an extra leading header
                     and are only accepted on read when that header equals the
                     current ``BYTECODEHEADER``.

                     The header has the form ``HG<VERSION>``: the literal ``HG``
                     followed by 2 binary bytes holding the transformation version.
                     """

                     def get_data(self, path):
                         """Read ``path``, validating and stripping the hg header
                         when it is a bytecode file."""
                         raw = super(hgloader, self).get_data(path)

                         suffixes = tuple(importlib.machinery.BYTECODE_SUFFIXES)
                         if path.endswith(suffixes):
                             # A missing or outdated header is reported with
                             # OSError, which ``SourceFileLoader.get_code()``
                             # treats as a "bad" cache file.
                             header = raw[:4]
                             if header[:2] != b'HG':
                                 raise OSError('no hg header')
                             if header != BYTECODEHEADER:
                                 raise OSError('hg header version mismatch')
                             return raw[4:]

                         # Anything that is not bytecode is passed through as-is.
                         return raw

                     def set_data(self, path, data, *args, **kwargs):
                         """Write ``data`` to ``path``, prefixing the hg header
                         when it is a bytecode file."""
                         suffixes = tuple(importlib.machinery.BYTECODE_SUFFIXES)
                         payload = BYTECODEHEADER + data if path.endswith(suffixes) else data
                         return super(hgloader, self).set_data(
                             path, payload, *args, **kwargs)

                     def source_to_code(self, data, path):
                         """Perform token transformation before compilation."""
                         stream = tokenize.tokenize(io.BytesIO(data).readline)
                         rewritten = replacetokens(list(stream), self.name)
                         transformed = tokenize.untokenize(rewritten)
                         # The built-in importer hides its own frames from
                         # tracebacks raised while importing, but offers no way to
                         # extend that to ours, so this frame shows up in import
                         # failures. Stripping it would need very ugly hacks, which
                         # is why it is not done.
                         return super(hgloader, self).source_to_code(transformed, path)
             # Importing this package installs the matching import hook as a side
             # effect, so every entry point can import mercurial.* modules without
             # doing the registration on its own.
             _importercls = hgpathentryfinder if sys.version_info[0] >= 3 else hgimporter
             # Register only once: do nothing when an instance is already present.
             if all(not isinstance(x, _importercls) for x in sys.meta_path):
                 # Front of meta_path: consulted before any implicit finders and
                 # before sys.path.
                 sys.meta_path.insert(0, _importercls())