upstream/mercurial-mirror Commit - r42153:95e4ae86

1

# patch.py - patch file parsing routines

1

# patch.py - patch file parsing routines

2

#

2

#

3

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

from __future__ import absolute_import, print_function

9

from __future__ import absolute_import, print_function

10

11

import collections

11

import collections

12

import contextlib

12

import contextlib

13

import copy

13

import copy

14

import email

14

import email

15

import errno

15

import errno

16

import hashlib

16

import hashlib

17

import os

17

import os

18

import re

18

import re

19

import shutil

19

import shutil

20

import zlib

20

import zlib

21

22

from .i18n import _

22

from .i18n import _

23

from .node import (

23

from .node import (

24

hex,

24

hex,

25

short,

25

short,

26

)

26

)

27

from . import (

27

from . import (

28

copies,

28

copies,

29

diffhelper,

29

diffhelper,

30

diffutil,

30

diffutil,

31

encoding,

31

encoding,

32

error,

32

error,

33

mail,

33

mail,

34

mdiff,

34

mdiff,

35

pathutil,

35

pathutil,

36

pycompat,

36

pycompat,

37

scmutil,

37

scmutil,

38

similar,

38

similar,

39

util,

39

util,

40

vfs as vfsmod,

40

vfs as vfsmod,

41

)

41

)

42

from .utils import (

42

from .utils import (

43

dateutil,

43

dateutil,

44

procutil,

44

procutil,

45

stringutil,

45

stringutil,

46

)

46

)

47

48

stringio = util.stringio

48

stringio = util.stringio

49

50

gitre = re.compile(br'diff --git a/(.*) b/(.*)')

50

gitre = re.compile(br'diff --git a/(.*) b/(.*)')

51

tabsplitter = re.compile(br'(\t+|[^\t]+)')

51

tabsplitter = re.compile(br'(\t+|[^\t]+)')

52

wordsplitter = re.compile(br'(\t+| +|[a-zA-Z0-9_\x80-\xff]+|'

52

wordsplitter = re.compile(br'(\t+| +|[a-zA-Z0-9_\x80-\xff]+|'

53

b'[^ \ta-zA-Z0-9_\x80-\xff])')

53

b'[^ \ta-zA-Z0-9_\x80-\xff])')

54

55

PatchError = error.PatchError

55

PatchError = error.PatchError

56

57

# public functions

57

# public functions

58

59

def split(stream):

59

def split(stream):

60

'''return an iterator of individual patches from a stream'''

60

'''return an iterator of individual patches from a stream'''

61

def isheader(line, inheader):

61

def isheader(line, inheader):

62

if inheader and line.startswith((' ', '\t')):

62

if inheader and line.startswith((' ', '\t')):

63

# continuation

63

# continuation

64

return True

64

return True

65

if line.startswith((' ', '-', '+')):

65

if line.startswith((' ', '-', '+')):

66

# diff line - don't check for header pattern in there

66

# diff line - don't check for header pattern in there

67

return False

67

return False

68

l = line.split(': ', 1)

68

l = line.split(': ', 1)

69

return len(l) == 2 and ' ' not in l[0]

69

return len(l) == 2 and ' ' not in l[0]

70

71

def chunk(lines):

71

def chunk(lines):

72

return stringio(''.join(lines))

72

return stringio(''.join(lines))

73

74

def hgsplit(stream, cur):

74

def hgsplit(stream, cur):

75

inheader = True

75

inheader = True

76

77

for line in stream:

77

for line in stream:

78

if not line.strip():

78

if not line.strip():

79

inheader = False

79

inheader = False

80

if not inheader and line.startswith('# HG changeset patch'):

80

if not inheader and line.startswith('# HG changeset patch'):

81

yield chunk(cur)

81

yield chunk(cur)

82

cur = []

82

cur = []

83

inheader = True

83

inheader = True

84

85

cur.append(line)

85

cur.append(line)

86

87

if cur:

87

if cur:

88

yield chunk(cur)

88

yield chunk(cur)

89

90

def mboxsplit(stream, cur):

90

def mboxsplit(stream, cur):

91

for line in stream:

91

for line in stream:

92

if line.startswith('From '):

92

if line.startswith('From '):

93

for c in split(chunk(cur[1:])):

93

for c in split(chunk(cur[1:])):

94

yield c

94

yield c

95

cur = []

95

cur = []

96

97

cur.append(line)

97

cur.append(line)

98

99

if cur:

99

if cur:

100

for c in split(chunk(cur[1:])):

100

for c in split(chunk(cur[1:])):

101

yield c

101

yield c

102

103

def mimesplit(stream, cur):

103

def mimesplit(stream, cur):

104

def msgfp(m):

104

def msgfp(m):

105

fp = stringio()

105

fp = stringio()

106

g = email.Generator.Generator(fp, mangle_from_=False)

106

g = email.Generator.Generator(fp, mangle_from_=False)

107

g.flatten(m)

107

g.flatten(m)

108

fp.seek(0)

108

fp.seek(0)

109

return fp

109

return fp

110

111

for line in stream:

111

for line in stream:

112

cur.append(line)

112

cur.append(line)

113

c = chunk(cur)

113

c = chunk(cur)

114

115

m = mail.parse(c)

115

m = mail.parse(c)

116

if not m.is_multipart():

116

if not m.is_multipart():

117

yield msgfp(m)

117

yield msgfp(m)

118

else:

118

else:

119

ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')

119

ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')

120

for part in m.walk():

120

for part in m.walk():

121

ct = part.get_content_type()

121

ct = part.get_content_type()

122

if ct not in ok_types:

122

if ct not in ok_types:

123

continue

123

continue

124

yield msgfp(part)

124

yield msgfp(part)

125

126

def headersplit(stream, cur):

126

def headersplit(stream, cur):

127

inheader = False

127

inheader = False

128

129

for line in stream:

129

for line in stream:

130

if not inheader and isheader(line, inheader):

130

if not inheader and isheader(line, inheader):

131

yield chunk(cur)

131

yield chunk(cur)

132

cur = []

132

cur = []

133

inheader = True

133

inheader = True

134

if inheader and not isheader(line, inheader):

134

if inheader and not isheader(line, inheader):

135

inheader = False

135

inheader = False

136

137

cur.append(line)

137

cur.append(line)

138

139

if cur:

139

if cur:

140

yield chunk(cur)

140

yield chunk(cur)

141

142

def remainder(cur):

142

def remainder(cur):

143

yield chunk(cur)

143

yield chunk(cur)

144

145

class fiter(object):

145

class fiter(object):

146

def __init__(self, fp):

146

def __init__(self, fp):

147

self.fp = fp

147

self.fp = fp

148

149

def __iter__(self):

149

def __iter__(self):

150

return self

150

return self

151

152

def next(self):

152

def next(self):

153

l = self.fp.readline()

153

l = self.fp.readline()

154

if not l:

154

if not l:

155

raise StopIteration

155

raise StopIteration

156

return l

156

return l

157

158

__next__ = next

158

__next__ = next

159

160

inheader = False

160

inheader = False

161

cur = []

161

cur = []

162

163

mimeheaders = ['content-type']

163

mimeheaders = ['content-type']

164

165

if not util.safehasattr(stream, 'next'):

165

if not util.safehasattr(stream, 'next'):

166

# http responses, for example, have readline but not next

166

# http responses, for example, have readline but not next

167

stream = fiter(stream)

167

stream = fiter(stream)

168

169

for line in stream:

169

for line in stream:

170

cur.append(line)

170

cur.append(line)

171

if line.startswith('# HG changeset patch'):

171

if line.startswith('# HG changeset patch'):

172

return hgsplit(stream, cur)

172

return hgsplit(stream, cur)

173

elif line.startswith('From '):

173

elif line.startswith('From '):

174

return mboxsplit(stream, cur)

174

return mboxsplit(stream, cur)

175

elif isheader(line, inheader):

175

elif isheader(line, inheader):

176

inheader = True

176

inheader = True

177

if line.split(':', 1)[0].lower() in mimeheaders:

177

if line.split(':', 1)[0].lower() in mimeheaders:

178

# let email parser handle this

178

# let email parser handle this

179

return mimesplit(stream, cur)

179

return mimesplit(stream, cur)

180

elif line.startswith('--- ') and inheader:

180

elif line.startswith('--- ') and inheader:

181

# No evil headers seen by diff start, split by hand

181

# No evil headers seen by diff start, split by hand

182

return headersplit(stream, cur)

182

return headersplit(stream, cur)

183

# Not enough info, keep reading

183

# Not enough info, keep reading

184

185

# if we are here, we have a very plain patch

185

# if we are here, we have a very plain patch

186

return remainder(cur)

186

return remainder(cur)

187

188

## Some facility for extensible patch parsing:

188

## Some facility for extensible patch parsing:

189

# list of pairs ("header to match", "data key")

189

# list of pairs ("header to match", "data key")

190

patchheadermap = [('Date', 'date'),

190

patchheadermap = [('Date', 'date'),

191

('Branch', 'branch'),

191

('Branch', 'branch'),

192

('Node ID', 'nodeid'),

192

('Node ID', 'nodeid'),

193

]

193

]

194

195

@contextlib.contextmanager

195

@contextlib.contextmanager

196

def extract(ui, fileobj):

196

def extract(ui, fileobj):

197

'''extract patch from data read from fileobj.

197

'''extract patch from data read from fileobj.

198

199

patch can be a normal patch or contained in an email message.

199

patch can be a normal patch or contained in an email message.

200

201

return a dictionary. Standard keys are:

201

return a dictionary. Standard keys are:

202

- filename,

202

- filename,

203

- message,

203

- message,

204

- user,

204

- user,

205

- date,

205

- date,

206

- branch,

206

- branch,

207

- node,

207

- node,

208

- p1,

208

- p1,

209

- p2.

209

- p2.

210

Any item can be missing from the dictionary. If filename is missing,

210

Any item can be missing from the dictionary. If filename is missing,

211

fileobj did not contain a patch. Caller must unlink filename when done.'''

211

fileobj did not contain a patch. Caller must unlink filename when done.'''

212

213

fd, tmpname = pycompat.mkstemp(prefix='hg-patch-')

213

fd, tmpname = pycompat.mkstemp(prefix='hg-patch-')

214

tmpfp = os.fdopen(fd, r'wb')

214

tmpfp = os.fdopen(fd, r'wb')

215

try:

215

try:

216

yield _extract(ui, fileobj, tmpname, tmpfp)

216

yield _extract(ui, fileobj, tmpname, tmpfp)

217

finally:

217

finally:

218

tmpfp.close()

218

tmpfp.close()

219

os.unlink(tmpname)

219

os.unlink(tmpname)

220

221

def _extract(ui, fileobj, tmpname, tmpfp):

221

def _extract(ui, fileobj, tmpname, tmpfp):

222

223

# attempt to detect the start of a patch

223

# attempt to detect the start of a patch

224

# (this heuristic is borrowed from quilt)

224

# (this heuristic is borrowed from quilt)

225

diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'

225

diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'

226

br'retrieving revision [0-9]+(\.[0-9]+)*$|'

226

br'retrieving revision [0-9]+(\.[0-9]+)*$|'

227

br'---[ \t].*?^\+\+\+[ \t]|'

227

br'---[ \t].*?^\+\+\+[ \t]|'

228

br'\*\*\*[ \t].*?^---[ \t])',

228

br'\*\*\*[ \t].*?^---[ \t])',

229

re.MULTILINE | re.DOTALL)

229

re.MULTILINE | re.DOTALL)

230

231

data = {}

231

data = {}

232

233

msg = mail.parse(fileobj)

233

msg = mail.parse(fileobj)

234

235

subject = msg[r'Subject'] and mail.headdecode(msg[r'Subject'])

235

subject = msg[r'Subject'] and mail.headdecode(msg[r'Subject'])

236

data['user'] = msg[r'From'] and mail.headdecode(msg[r'From'])

236

data['user'] = msg[r'From'] and mail.headdecode(msg[r'From'])

237

if not subject and not data['user']:

237

if not subject and not data['user']:

238

# Not an email, restore parsed headers if any

238

# Not an email, restore parsed headers if any

239

subject = '\n'.join(': '.join(map(encoding.strtolocal, h))

239

subject = '\n'.join(': '.join(map(encoding.strtolocal, h))

240

for h in msg.items()) + '\n'

240

for h in msg.items()) + '\n'

241

242

# should try to parse msg['Date']

242

# should try to parse msg['Date']

243

parents = []

243

parents = []

244

245

if subject:

245

if subject:

246

if subject.startswith('[PATCH'):

246

if subject.startswith('[PATCH'):

247

pend = subject.find(']')

247

pend = subject.find(']')

248

if pend >= 0:

248

if pend >= 0:

249

subject = subject[pend + 1:].lstrip()

249

subject = subject[pend + 1:].lstrip()

250

subject = re.sub(br'\n[ \t]+', ' ', subject)

250

subject = re.sub(br'\n[ \t]+', ' ', subject)

251

ui.debug('Subject: %s\n' % subject)

251

ui.debug('Subject: %s\n' % subject)

252

if data['user']:

252

if data['user']:

253

ui.debug('From: %s\n' % data['user'])

253

ui.debug('From: %s\n' % data['user'])

254

diffs_seen = 0

254

diffs_seen = 0

255

ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')

255

ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')

256

message = ''

256

message = ''

257

for part in msg.walk():

257

for part in msg.walk():

258

content_type = pycompat.bytestr(part.get_content_type())

258

content_type = pycompat.bytestr(part.get_content_type())

259

ui.debug('Content-Type: %s\n' % content_type)

259

ui.debug('Content-Type: %s\n' % content_type)

260

if content_type not in ok_types:

260

if content_type not in ok_types:

261

continue

261

continue

262

payload = part.get_payload(decode=True)

262

payload = part.get_payload(decode=True)

263

m = diffre.search(payload)

263

m = diffre.search(payload)

264

if m:

264

if m:

265

hgpatch = False

265

hgpatch = False

266

hgpatchheader = False

266

hgpatchheader = False

267

ignoretext = False

267

ignoretext = False

268

269

ui.debug('found patch at byte %d\n' % m.start(0))

269

ui.debug('found patch at byte %d\n' % m.start(0))

270

diffs_seen += 1

270

diffs_seen += 1

271

cfp = stringio()

271

cfp = stringio()

272

for line in payload[:m.start(0)].splitlines():

272

for line in payload[:m.start(0)].splitlines():

273

if line.startswith('# HG changeset patch') and not hgpatch:

273

if line.startswith('# HG changeset patch') and not hgpatch:

274

ui.debug('patch generated by hg export\n')

274

ui.debug('patch generated by hg export\n')

275

hgpatch = True

275

hgpatch = True

276

hgpatchheader = True

276

hgpatchheader = True

277

# drop earlier commit message content

277

# drop earlier commit message content

278

cfp.seek(0)

278

cfp.seek(0)

279

cfp.truncate()

279

cfp.truncate()

280

subject = None

280

subject = None

281

elif hgpatchheader:

281

elif hgpatchheader:

282

if line.startswith('# User '):

282

if line.startswith('# User '):

283

data['user'] = line[7:]

283

data['user'] = line[7:]

284

ui.debug('From: %s\n' % data['user'])

284

ui.debug('From: %s\n' % data['user'])

285

elif line.startswith("# Parent "):

285

elif line.startswith("# Parent "):

286

parents.append(line[9:].lstrip())

286

parents.append(line[9:].lstrip())

287

elif line.startswith("# "):

287

elif line.startswith("# "):

288

for header, key in patchheadermap:

288

for header, key in patchheadermap:

289

prefix = '# %s ' % header

289

prefix = '# %s ' % header

290

if line.startswith(prefix):

290

if line.startswith(prefix):

291

data[key] = line[len(prefix):]

291

data[key] = line[len(prefix):]

292

else:

292

else:

293

hgpatchheader = False

293

hgpatchheader = False

294

elif line == '---':

294

elif line == '---':

295

ignoretext = True

295

ignoretext = True

296

if not hgpatchheader and not ignoretext:

296

if not hgpatchheader and not ignoretext:

297

cfp.write(line)

297

cfp.write(line)

298

cfp.write('\n')

298

cfp.write('\n')

299

message = cfp.getvalue()

299

message = cfp.getvalue()

300

if tmpfp:

300

if tmpfp:

301

tmpfp.write(payload)

301

tmpfp.write(payload)

302

if not payload.endswith('\n'):

302

if not payload.endswith('\n'):

303

tmpfp.write('\n')

303

tmpfp.write('\n')

304

elif not diffs_seen and message and content_type == 'text/plain':

304

elif not diffs_seen and message and content_type == 'text/plain':

305

message += '\n' + payload

305

message += '\n' + payload

306

307

if subject and not message.startswith(subject):

307

if subject and not message.startswith(subject):

308

message = '%s\n%s' % (subject, message)

308

message = '%s\n%s' % (subject, message)

309

data['message'] = message

309

data['message'] = message

310

tmpfp.close()

310

tmpfp.close()

311

if parents:

311

if parents:

312

data['p1'] = parents.pop(0)

312

data['p1'] = parents.pop(0)

313

if parents:

313

if parents:

314

data['p2'] = parents.pop(0)

314

data['p2'] = parents.pop(0)

315

316

if diffs_seen:

316

if diffs_seen:

317

data['filename'] = tmpname

317

data['filename'] = tmpname

318

319

return data

319

return data

320

321

class patchmeta(object):

321

class patchmeta(object):

322

"""Patched file metadata

322

"""Patched file metadata

323

324

'op' is the performed operation within ADD, DELETE, RENAME, MODIFY

324

'op' is the performed operation within ADD, DELETE, RENAME, MODIFY

325

or COPY. 'path' is patched file path. 'oldpath' is set to the

325

or COPY. 'path' is patched file path. 'oldpath' is set to the

326

origin file when 'op' is either COPY or RENAME, None otherwise. If

326

origin file when 'op' is either COPY or RENAME, None otherwise. If

327

file mode is changed, 'mode' is a tuple (islink, isexec) where

327

file mode is changed, 'mode' is a tuple (islink, isexec) where

328

'islink' is True if the file is a symlink and 'isexec' is True if

328

'islink' is True if the file is a symlink and 'isexec' is True if

329

the file is executable. Otherwise, 'mode' is None.

329

the file is executable. Otherwise, 'mode' is None.

330

"""

330

"""

331

def __init__(self, path):

331

def __init__(self, path):

332

self.path = path

332

self.path = path

333

self.oldpath = None

333

self.oldpath = None

334

self.mode = None

334

self.mode = None

335

self.op = 'MODIFY'

335

self.op = 'MODIFY'

336

self.binary = False

336

self.binary = False

337

338

def setmode(self, mode):

338

def setmode(self, mode):

339

islink = mode & 0o20000

339

islink = mode & 0o20000

340

isexec = mode & 0o100

340

isexec = mode & 0o100

341

self.mode = (islink, isexec)

341

self.mode = (islink, isexec)

342

343

def copy(self):

343

def copy(self):

344

other = patchmeta(self.path)

344

other = patchmeta(self.path)

345

other.oldpath = self.oldpath

345

other.oldpath = self.oldpath

346

other.mode = self.mode

346

other.mode = self.mode

347

other.op = self.op

347

other.op = self.op

348

other.binary = self.binary

348

other.binary = self.binary

349

return other

349

return other

350

351

def _ispatchinga(self, afile):

351

def _ispatchinga(self, afile):

352

if afile == '/dev/null':

352

if afile == '/dev/null':

353

return self.op == 'ADD'

353

return self.op == 'ADD'

354

return afile == 'a/' + (self.oldpath or self.path)

354

return afile == 'a/' + (self.oldpath or self.path)

355

356

def _ispatchingb(self, bfile):

356

def _ispatchingb(self, bfile):

357

if bfile == '/dev/null':

357

if bfile == '/dev/null':

358

return self.op == 'DELETE'

358

return self.op == 'DELETE'

359

return bfile == 'b/' + self.path

359

return bfile == 'b/' + self.path

360

361

def ispatching(self, afile, bfile):

361

def ispatching(self, afile, bfile):

362

return self._ispatchinga(afile) and self._ispatchingb(bfile)

362

return self._ispatchinga(afile) and self._ispatchingb(bfile)

363

364

def __repr__(self):

364

def __repr__(self):

365

return r"<patchmeta %s %r>" % (self.op, self.path)

365

return r"<patchmeta %s %r>" % (self.op, self.path)

366

367

def readgitpatch(lr):

367

def readgitpatch(lr):

368

"""extract git-style metadata about patches from <patchname>"""

368

"""extract git-style metadata about patches from <patchname>"""

369

370

# Filter patch for git information

370

# Filter patch for git information

371

gp = None

371

gp = None

372

gitpatches = []

372

gitpatches = []

373

for line in lr:

373

for line in lr:

374

line = line.rstrip(' \r\n')

374

line = line.rstrip(' \r\n')

375

if line.startswith('diff --git a/'):

375

if line.startswith('diff --git a/'):

376

m = gitre.match(line)

376

m = gitre.match(line)

377

if m:

377

if m:

378

if gp:

378

if gp:

379

gitpatches.append(gp)

379

gitpatches.append(gp)

380

dst = m.group(2)

380

dst = m.group(2)

381

gp = patchmeta(dst)

381

gp = patchmeta(dst)

382

elif gp:

382

elif gp:

383

if line.startswith('--- '):

383

if line.startswith('--- '):

384

gitpatches.append(gp)

384

gitpatches.append(gp)

385

gp = None

385

gp = None

386

continue

386

continue

387

if line.startswith('rename from '):

387

if line.startswith('rename from '):

388

gp.op = 'RENAME'

388

gp.op = 'RENAME'

389

gp.oldpath = line[12:]

389

gp.oldpath = line[12:]

390

elif line.startswith('rename to '):

390

elif line.startswith('rename to '):

391

gp.path = line[10:]

391

gp.path = line[10:]

392

elif line.startswith('copy from '):

392

elif line.startswith('copy from '):

393

gp.op = 'COPY'

393

gp.op = 'COPY'

394

gp.oldpath = line[10:]

394

gp.oldpath = line[10:]

395

elif line.startswith('copy to '):

395

elif line.startswith('copy to '):

396

gp.path = line[8:]

396

gp.path = line[8:]

397

elif line.startswith('deleted file'):

397

elif line.startswith('deleted file'):

398

gp.op = 'DELETE'

398

gp.op = 'DELETE'

399

elif line.startswith('new file mode '):

399

elif line.startswith('new file mode '):

400

gp.op = 'ADD'

400

gp.op = 'ADD'

401

gp.setmode(int(line[-6:], 8))

401

gp.setmode(int(line[-6:], 8))

402

elif line.startswith('new mode '):

402

elif line.startswith('new mode '):

403

gp.setmode(int(line[-6:], 8))

403

gp.setmode(int(line[-6:], 8))

404

elif line.startswith('GIT binary patch'):

404

elif line.startswith('GIT binary patch'):

405

gp.binary = True

405

gp.binary = True

406

if gp:

406

if gp:

407

gitpatches.append(gp)

407

gitpatches.append(gp)

408

409

return gitpatches

409

return gitpatches

410

411

class linereader(object):

411

class linereader(object):

412

# simple class to allow pushing lines back into the input stream

412

# simple class to allow pushing lines back into the input stream

413

def __init__(self, fp):

413

def __init__(self, fp):

414

self.fp = fp

414

self.fp = fp

415

self.buf = []

415

self.buf = []

416

417

def push(self, line):

417

def push(self, line):

418

if line is not None:

418

if line is not None:

419

self.buf.append(line)

419

self.buf.append(line)

420

421

def readline(self):

421

def readline(self):

422

if self.buf:

422

if self.buf:

423

l = self.buf[0]

423

l = self.buf[0]

424

del self.buf[0]

424

del self.buf[0]

425

return l

425

return l

426

return self.fp.readline()

426

return self.fp.readline()

427

428

def __iter__(self):

428

def __iter__(self):

429

return iter(self.readline, '')

429

return iter(self.readline, '')

430

431

class abstractbackend(object):

431

class abstractbackend(object):

432

def __init__(self, ui):

432

def __init__(self, ui):

433

self.ui = ui

433

self.ui = ui

434

435

def getfile(self, fname):

435

def getfile(self, fname):

436

"""Return target file data and flags as a (data, (islink,

436

"""Return target file data and flags as a (data, (islink,

437

isexec)) tuple. Data is None if file is missing/deleted.

437

isexec)) tuple. Data is None if file is missing/deleted.

438

"""

438

"""

439

raise NotImplementedError

439

raise NotImplementedError

440

441

def setfile(self, fname, data, mode, copysource):

441

def setfile(self, fname, data, mode, copysource):

442

"""Write data to target file fname and set its mode. mode is a

442

"""Write data to target file fname and set its mode. mode is a

443

(islink, isexec) tuple. If data is None, the file content should

443

(islink, isexec) tuple. If data is None, the file content should

444

be left unchanged. If the file is modified after being copied,

444

be left unchanged. If the file is modified after being copied,

445

copysource is set to the original file name.

445

copysource is set to the original file name.

446

"""

446

"""

447

raise NotImplementedError

447

raise NotImplementedError

448

449

def unlink(self, fname):

449

def unlink(self, fname):

450

"""Unlink target file."""

450

"""Unlink target file."""

451

raise NotImplementedError

451

raise NotImplementedError

452

453

def writerej(self, fname, failed, total, lines):

453

def writerej(self, fname, failed, total, lines):

454

"""Write rejected lines for fname. total is the number of hunks

454

"""Write rejected lines for fname. total is the number of hunks

455

which failed to apply and total the total number of hunks for this

455

which failed to apply and total the total number of hunks for this

456

files.

456

files.

457

"""

457

"""

458

459

def exists(self, fname):

459

def exists(self, fname):

460

raise NotImplementedError

460

raise NotImplementedError

461

462

def close(self):

462

def close(self):

463

raise NotImplementedError

463

raise NotImplementedError

464

465

class fsbackend(abstractbackend):

465

class fsbackend(abstractbackend):

466

def __init__(self, ui, basedir):

466

def __init__(self, ui, basedir):

467

super(fsbackend, self).__init__(ui)

467

super(fsbackend, self).__init__(ui)

468

self.opener = vfsmod.vfs(basedir)

468

self.opener = vfsmod.vfs(basedir)

469

470

def getfile(self, fname):

470

def getfile(self, fname):

471

if self.opener.islink(fname):

471

if self.opener.islink(fname):

472

return (self.opener.readlink(fname), (True, False))

472

return (self.opener.readlink(fname), (True, False))

473

474

isexec = False

474

isexec = False

475

try:

475

try:

476

isexec = self.opener.lstat(fname).st_mode & 0o100 != 0

476

isexec = self.opener.lstat(fname).st_mode & 0o100 != 0

477

except OSError as e:

477

except OSError as e:

478

if e.errno != errno.ENOENT:

478

if e.errno != errno.ENOENT:

479

raise

479

raise

480

try:

480

try:

481

return (self.opener.read(fname), (False, isexec))

481

return (self.opener.read(fname), (False, isexec))

482

except IOError as e:

482

except IOError as e:

483

if e.errno != errno.ENOENT:

483

if e.errno != errno.ENOENT:

484

raise

484

raise

485

return None, None

485

return None, None

486

487

def setfile(self, fname, data, mode, copysource):

487

def setfile(self, fname, data, mode, copysource):

488

islink, isexec = mode

488

islink, isexec = mode

489

if data is None:

489

if data is None:

490

self.opener.setflags(fname, islink, isexec)

490

self.opener.setflags(fname, islink, isexec)

491

return

491

return

492

if islink:

492

if islink:

493

self.opener.symlink(data, fname)

493

self.opener.symlink(data, fname)

494

else:

494

else:

495

self.opener.write(fname, data)

495

self.opener.write(fname, data)

496

if isexec:

496

if isexec:

497

self.opener.setflags(fname, False, True)

497

self.opener.setflags(fname, False, True)

498

499

def unlink(self, fname):

499

def unlink(self, fname):

500

rmdir = self.ui.configbool('experimental', 'removeemptydirs')

500

rmdir = self.ui.configbool('experimental', 'removeemptydirs')

501

self.opener.unlinkpath(fname, ignoremissing=True, rmdir=rmdir)

501

self.opener.unlinkpath(fname, ignoremissing=True, rmdir=rmdir)

502

503

def writerej(self, fname, failed, total, lines):

503

def writerej(self, fname, failed, total, lines):

504

fname = fname + ".rej"

504

fname = fname + ".rej"

505

self.ui.warn(

505

self.ui.warn(

506

_("%d out of %d hunks FAILED -- saving rejects to file %s\n") %

506

_("%d out of %d hunks FAILED -- saving rejects to file %s\n") %

507

(failed, total, fname))

507

(failed, total, fname))

508

fp = self.opener(fname, 'w')

508

fp = self.opener(fname, 'w')

509

fp.writelines(lines)

509

fp.writelines(lines)

510

fp.close()

510

fp.close()

511

512

def exists(self, fname):

512

def exists(self, fname):

513

return self.opener.lexists(fname)

513

return self.opener.lexists(fname)

514

515

class workingbackend(fsbackend):

515

class workingbackend(fsbackend):

516

def __init__(self, ui, repo, similarity):

516

def __init__(self, ui, repo, similarity):

517

super(workingbackend, self).__init__(ui, repo.root)

517

super(workingbackend, self).__init__(ui, repo.root)

518

self.repo = repo

518

self.repo = repo

519

self.similarity = similarity

519

self.similarity = similarity

520

self.removed = set()

520

self.removed = set()

521

self.changed = set()

521

self.changed = set()

522

self.copied = []

522

self.copied = []

523

524

def _checkknown(self, fname):

524

def _checkknown(self, fname):

525

if self.repo.dirstate[fname] == '?' and self.exists(fname):

525

if self.repo.dirstate[fname] == '?' and self.exists(fname):

526

raise PatchError(_('cannot patch %s: file is not tracked') % fname)

526

raise PatchError(_('cannot patch %s: file is not tracked') % fname)

527

528

def setfile(self, fname, data, mode, copysource):

528

def setfile(self, fname, data, mode, copysource):

529

self._checkknown(fname)

529

self._checkknown(fname)

530

super(workingbackend, self).setfile(fname, data, mode, copysource)

530

super(workingbackend, self).setfile(fname, data, mode, copysource)

531

if copysource is not None:

531

if copysource is not None:

532

self.copied.append((copysource, fname))

532

self.copied.append((copysource, fname))

533

self.changed.add(fname)

533

self.changed.add(fname)

534

535

def unlink(self, fname):

535

def unlink(self, fname):

536

self._checkknown(fname)

536

self._checkknown(fname)

537

super(workingbackend, self).unlink(fname)

537

super(workingbackend, self).unlink(fname)

538

self.removed.add(fname)

538

self.removed.add(fname)

539

self.changed.add(fname)

539

self.changed.add(fname)

540

541

def close(self):

541

def close(self):

542

wctx = self.repo[None]

542

wctx = self.repo[None]

543

changed = set(self.changed)

543

changed = set(self.changed)

544

for src, dst in self.copied:

544

for src, dst in self.copied:

545

scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst)

545

scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst)

546

if self.removed:

546

if self.removed:

547

wctx.forget(sorted(self.removed))

547

wctx.forget(sorted(self.removed))

548

for f in self.removed:

548

for f in self.removed:

549

if f not in self.repo.dirstate:

549

if f not in self.repo.dirstate:

550

# File was deleted and no longer belongs to the

550

# File was deleted and no longer belongs to the

551

# dirstate, it was probably marked added then

551

# dirstate, it was probably marked added then

552

# deleted, and should not be considered by

552

# deleted, and should not be considered by

553

# marktouched().

553

# marktouched().

554

changed.discard(f)

554

changed.discard(f)

555

if changed:

555

if changed:

556

scmutil.marktouched(self.repo, changed, self.similarity)

556

scmutil.marktouched(self.repo, changed, self.similarity)

557

return sorted(self.changed)

557

return sorted(self.changed)

558

559

class filestore(object):

559

class filestore(object):

560

def __init__(self, maxsize=None):

560

def __init__(self, maxsize=None):

561

self.opener = None

561

self.opener = None

562

self.files = {}

562

self.files = {}

563

self.created = 0

563

self.created = 0

564

self.maxsize = maxsize

564

self.maxsize = maxsize

565

if self.maxsize is None:

565

if self.maxsize is None:

566

self.maxsize = 4*(2**20)

566

self.maxsize = 4*(2**20)

567

self.size = 0

567

self.size = 0

568

self.data = {}

568

self.data = {}

569

570

def setfile(self, fname, data, mode, copied=None):

570

def setfile(self, fname, data, mode, copied=None):

571

if self.maxsize < 0 or (len(data) + self.size) <= self.maxsize:

571

if self.maxsize < 0 or (len(data) + self.size) <= self.maxsize:

572

self.data[fname] = (data, mode, copied)

572

self.data[fname] = (data, mode, copied)

573

self.size += len(data)

573

self.size += len(data)

574

else:

574

else:

575

if self.opener is None:

575

if self.opener is None:

576

root = pycompat.mkdtemp(prefix='hg-patch-')

576

root = pycompat.mkdtemp(prefix='hg-patch-')

577

self.opener = vfsmod.vfs(root)

577

self.opener = vfsmod.vfs(root)

578

# Avoid filename issues with these simple names

578

# Avoid filename issues with these simple names

579

fn = '%d' % self.created

579

fn = '%d' % self.created

580

self.opener.write(fn, data)

580

self.opener.write(fn, data)

581

self.created += 1

581

self.created += 1

582

self.files[fname] = (fn, mode, copied)

582

self.files[fname] = (fn, mode, copied)

583

584

def getfile(self, fname):

584

def getfile(self, fname):

585

if fname in self.data:

585

if fname in self.data:

586

return self.data[fname]

586

return self.data[fname]

587

if not self.opener or fname not in self.files:

587

if not self.opener or fname not in self.files:

588

return None, None, None

588

return None, None, None

589

fn, mode, copied = self.files[fname]

589

fn, mode, copied = self.files[fname]

590

return self.opener.read(fn), mode, copied

590

return self.opener.read(fn), mode, copied

591

592

def close(self):

592

def close(self):

593

if self.opener:

593

if self.opener:

594

shutil.rmtree(self.opener.base)

594

shutil.rmtree(self.opener.base)

595

596

class repobackend(abstractbackend):

596

class repobackend(abstractbackend):

597

def __init__(self, ui, repo, ctx, store):

597

def __init__(self, ui, repo, ctx, store):

598

super(repobackend, self).__init__(ui)

598

super(repobackend, self).__init__(ui)

599

self.repo = repo

599

self.repo = repo

600

self.ctx = ctx

600

self.ctx = ctx

601

self.store = store

601

self.store = store

602

self.changed = set()

602

self.changed = set()

603

self.removed = set()

603

self.removed = set()

604

self.copied = {}

604

self.copied = {}

605

606

def _checkknown(self, fname):

606

def _checkknown(self, fname):

607

if fname not in self.ctx:

607

if fname not in self.ctx:

608

raise PatchError(_('cannot patch %s: file is not tracked') % fname)

608

raise PatchError(_('cannot patch %s: file is not tracked') % fname)

609

610

def getfile(self, fname):

610

def getfile(self, fname):

611

try:

611

try:

612

fctx = self.ctx[fname]

612

fctx = self.ctx[fname]

613

except error.LookupError:

613

except error.LookupError:

614

return None, None

614

return None, None

615

flags = fctx.flags()

615

flags = fctx.flags()

616

return fctx.data(), ('l' in flags, 'x' in flags)

616

return fctx.data(), ('l' in flags, 'x' in flags)

617

618

def setfile(self, fname, data, mode, copysource):

618

def setfile(self, fname, data, mode, copysource):

619

if copysource:

619

if copysource:

620

self._checkknown(copysource)

620

self._checkknown(copysource)

621

if data is None:

621

if data is None:

622

data = self.ctx[fname].data()

622

data = self.ctx[fname].data()

623

self.store.setfile(fname, data, mode, copysource)

623

self.store.setfile(fname, data, mode, copysource)

624

self.changed.add(fname)

624

self.changed.add(fname)

625

if copysource:

625

if copysource:

626

self.copied[fname] = copysource

626

self.copied[fname] = copysource

627

628

def unlink(self, fname):

628

def unlink(self, fname):

629

self._checkknown(fname)

629

self._checkknown(fname)

630

self.removed.add(fname)

630

self.removed.add(fname)

631

632

def exists(self, fname):

632

def exists(self, fname):

633

return fname in self.ctx

633

return fname in self.ctx

634

635

def close(self):

635

def close(self):

636

return self.changed | self.removed

636

return self.changed | self.removed

637

638

# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1

638

# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1

639

unidesc = re.compile(br'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')

639

unidesc = re.compile(br'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')

640

contextdesc = re.compile(br'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')

640

contextdesc = re.compile(br'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')

641

eolmodes = ['strict', 'crlf', 'lf', 'auto']

641

eolmodes = ['strict', 'crlf', 'lf', 'auto']

642

643

class patchfile(object):

643

class patchfile(object):

644

def __init__(self, ui, gp, backend, store, eolmode='strict'):

644

def __init__(self, ui, gp, backend, store, eolmode='strict'):

645

self.fname = gp.path

645

self.fname = gp.path

646

self.eolmode = eolmode

646

self.eolmode = eolmode

647

self.eol = None

647

self.eol = None

648

self.backend = backend

648

self.backend = backend

649

self.ui = ui

649

self.ui = ui

650

self.lines = []

650

self.lines = []

651

self.exists = False

651

self.exists = False

652

self.missing = True

652

self.missing = True

653

self.mode = gp.mode

653

self.mode = gp.mode

654

self.copysource = gp.oldpath

654

self.copysource = gp.oldpath

655

self.create = gp.op in ('ADD', 'COPY', 'RENAME')

655

self.create = gp.op in ('ADD', 'COPY', 'RENAME')

656

self.remove = gp.op == 'DELETE'

656

self.remove = gp.op == 'DELETE'

657

if self.copysource is None:

657

if self.copysource is None:

658

data, mode = backend.getfile(self.fname)

658

data, mode = backend.getfile(self.fname)

659

else:

659

else:

660

data, mode = store.getfile(self.copysource)[:2]

660

data, mode = store.getfile(self.copysource)[:2]

661

if data is not None:

661

if data is not None:

662

self.exists = self.copysource is None or backend.exists(self.fname)

662

self.exists = self.copysource is None or backend.exists(self.fname)

663

self.missing = False

663

self.missing = False

664

if data:

664

if data:

665

self.lines = mdiff.splitnewlines(data)

665

self.lines = mdiff.splitnewlines(data)

666

if self.mode is None:

666

if self.mode is None:

667

self.mode = mode

667

self.mode = mode

668

if self.lines:

668

if self.lines:

669

# Normalize line endings

669

# Normalize line endings

670

if self.lines[0].endswith('\r\n'):

670

if self.lines[0].endswith('\r\n'):

671

self.eol = '\r\n'

671

self.eol = '\r\n'

672

elif self.lines[0].endswith('\n'):

672

elif self.lines[0].endswith('\n'):

673

self.eol = '\n'

673

self.eol = '\n'

674

if eolmode != 'strict':

674

if eolmode != 'strict':

675

nlines = []

675

nlines = []

676

for l in self.lines:

676

for l in self.lines:

677

if l.endswith('\r\n'):

677

if l.endswith('\r\n'):

678

l = l[:-2] + '\n'

678

l = l[:-2] + '\n'

679

nlines.append(l)

679

nlines.append(l)

680

self.lines = nlines

680

self.lines = nlines

681

else:

681

else:

682

if self.create:

682

if self.create:

683

self.missing = False

683

self.missing = False

684

if self.mode is None:

684

if self.mode is None:

685

self.mode = (False, False)

685

self.mode = (False, False)

686

if self.missing:

686

if self.missing:

687

self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)

687

self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)

688

self.ui.warn(_("(use '--prefix' to apply patch relative to the "

688

self.ui.warn(_("(use '--prefix' to apply patch relative to the "

689

"current directory)\n"))

689

"current directory)\n"))

690

691

self.hash = {}

691

self.hash = {}

692

self.dirty = 0

692

self.dirty = 0

693

self.offset = 0

693

self.offset = 0

694

self.skew = 0

694

self.skew = 0

695

self.rej = []

695

self.rej = []

696

self.fileprinted = False

696

self.fileprinted = False

697

self.printfile(False)

697

self.printfile(False)

698

self.hunks = 0

698

self.hunks = 0

699

700

def writelines(self, fname, lines, mode):

700

def writelines(self, fname, lines, mode):

701

if self.eolmode == 'auto':

701

if self.eolmode == 'auto':

702

eol = self.eol

702

eol = self.eol

703

elif self.eolmode == 'crlf':

703

elif self.eolmode == 'crlf':

704

eol = '\r\n'

704

eol = '\r\n'

705

else:

705

else:

706

eol = '\n'

706

eol = '\n'

707

708

if self.eolmode != 'strict' and eol and eol != '\n':

708

if self.eolmode != 'strict' and eol and eol != '\n':

709

rawlines = []

709

rawlines = []

710

for l in lines:

710

for l in lines:

711

if l and l.endswith('\n'):

711

if l and l.endswith('\n'):

712

l = l[:-1] + eol

712

l = l[:-1] + eol

713

rawlines.append(l)

713

rawlines.append(l)

714

lines = rawlines

714

lines = rawlines

715

716

self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

716

self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

717

718

def printfile(self, warn):

718

def printfile(self, warn):

719

if self.fileprinted:

719

if self.fileprinted:

720

return

720

return

721

if warn or self.ui.verbose:

721

if warn or self.ui.verbose:

722

self.fileprinted = True

722

self.fileprinted = True

723

s = _("patching file %s\n") % self.fname

723

s = _("patching file %s\n") % self.fname

724

if warn:

724

if warn:

725

self.ui.warn(s)

725

self.ui.warn(s)

726

else:

726

else:

727

self.ui.note(s)

727

self.ui.note(s)

728

729

730

def findlines(self, l, linenum):

730

def findlines(self, l, linenum):

731

# looks through the hash and finds candidate lines. The

731

# looks through the hash and finds candidate lines. The

732

# result is a list of line numbers sorted based on distance

732

# result is a list of line numbers sorted based on distance

733

# from linenum

733

# from linenum

734

735

cand = self.hash.get(l, [])

735

cand = self.hash.get(l, [])

736

if len(cand) > 1:

736

if len(cand) > 1:

737

# resort our list of potentials forward then back.

737

# resort our list of potentials forward then back.

738

cand.sort(key=lambda x: abs(x - linenum))

738

cand.sort(key=lambda x: abs(x - linenum))

739

return cand

739

return cand

740

741

def write_rej(self):

741

def write_rej(self):

742

# our rejects are a little different from patch(1). This always

742

# our rejects are a little different from patch(1). This always

743

# creates rejects in the same form as the original patch. A file

743

# creates rejects in the same form as the original patch. A file

744

# header is inserted so that you can run the reject through patch again

744

# header is inserted so that you can run the reject through patch again

745

# without having to type the filename.

745

# without having to type the filename.

746

if not self.rej:

746

if not self.rej:

747

return

747

return

748

base = os.path.basename(self.fname)

748

base = os.path.basename(self.fname)

749

lines = ["--- %s\n+++ %s\n" % (base, base)]

749

lines = ["--- %s\n+++ %s\n" % (base, base)]

750

for x in self.rej:

750

for x in self.rej:

751

for l in x.hunk:

751

for l in x.hunk:

752

lines.append(l)

752

lines.append(l)

753

if l[-1:] != '\n':

753

if l[-1:] != '\n':

754

lines.append("\n\\ No newline at end of file\n")

754

lines.append("\n\\ No newline at end of file\n")

755

self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

755

self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

756

757

def apply(self, h):

757

def apply(self, h):

758

if not h.complete():

758

if not h.complete():

759

raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %

759

raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %

760

(h.number, h.desc, len(h.a), h.lena, len(h.b),

760

(h.number, h.desc, len(h.a), h.lena, len(h.b),

761

h.lenb))

761

h.lenb))

762

763

self.hunks += 1

763

self.hunks += 1

764

765

if self.missing:

765

if self.missing:

766

self.rej.append(h)

766

self.rej.append(h)

767

return -1

767

return -1

768

769

if self.exists and self.create:

769

if self.exists and self.create:

770

if self.copysource:

770

if self.copysource:

771

self.ui.warn(_("cannot create %s: destination already "

771

self.ui.warn(_("cannot create %s: destination already "

772

"exists\n") % self.fname)

772

"exists\n") % self.fname)

773

else:

773

else:

774

self.ui.warn(_("file %s already exists\n") % self.fname)

774

self.ui.warn(_("file %s already exists\n") % self.fname)

775

self.rej.append(h)

775

self.rej.append(h)

776

return -1

776

return -1

777

778

if isinstance(h, binhunk):

778

if isinstance(h, binhunk):

779

if self.remove:

779

if self.remove:

780

self.backend.unlink(self.fname)

780

self.backend.unlink(self.fname)

781

else:

781

else:

782

l = h.new(self.lines)

782

l = h.new(self.lines)

783

self.lines[:] = l

783

self.lines[:] = l

784

self.offset += len(l)

784

self.offset += len(l)

785

self.dirty = True

785

self.dirty = True

786

return 0

786

return 0

787

788

horig = h

788

horig = h

789

if (self.eolmode in ('crlf', 'lf')

789

if (self.eolmode in ('crlf', 'lf')

790

or self.eolmode == 'auto' and self.eol):

790

or self.eolmode == 'auto' and self.eol):

791

# If new eols are going to be normalized, then normalize

791

# If new eols are going to be normalized, then normalize

792

# hunk data before patching. Otherwise, preserve input

792

# hunk data before patching. Otherwise, preserve input

793

# line-endings.

793

# line-endings.

794

h = h.getnormalized()

794

h = h.getnormalized()

795

796

# fast case first, no offsets, no fuzz

796

# fast case first, no offsets, no fuzz

797

old, oldstart, new, newstart = h.fuzzit(0, False)

797

old, oldstart, new, newstart = h.fuzzit(0, False)

798

oldstart += self.offset

798

oldstart += self.offset

799

orig_start = oldstart

799

orig_start = oldstart

800

# if there's skew we want to emit the "(offset %d lines)" even

800

# if there's skew we want to emit the "(offset %d lines)" even

801

# when the hunk cleanly applies at start + skew, so skip the

801

# when the hunk cleanly applies at start + skew, so skip the

802

# fast case code

802

# fast case code

803

if self.skew == 0 and diffhelper.testhunk(old, self.lines, oldstart):

803

if self.skew == 0 and diffhelper.testhunk(old, self.lines, oldstart):

804

if self.remove:

804

if self.remove:

805

self.backend.unlink(self.fname)

805

self.backend.unlink(self.fname)

806

else:

806

else:

807

self.lines[oldstart:oldstart + len(old)] = new

807

self.lines[oldstart:oldstart + len(old)] = new

808

self.offset += len(new) - len(old)

808

self.offset += len(new) - len(old)

809

self.dirty = True

809

self.dirty = True

810

return 0

810

return 0

811

812

# ok, we couldn't match the hunk. Lets look for offsets and fuzz it

812

# ok, we couldn't match the hunk. Lets look for offsets and fuzz it

813

self.hash = {}

813

self.hash = {}

814

for x, s in enumerate(self.lines):

814

for x, s in enumerate(self.lines):

815

self.hash.setdefault(s, []).append(x)

815

self.hash.setdefault(s, []).append(x)

816

817

for fuzzlen in pycompat.xrange(self.ui.configint("patch", "fuzz") + 1):

817

for fuzzlen in pycompat.xrange(self.ui.configint("patch", "fuzz") + 1):

818

for toponly in [True, False]:

818

for toponly in [True, False]:

819

old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)

819

old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)

820

oldstart = oldstart + self.offset + self.skew

820

oldstart = oldstart + self.offset + self.skew

821

oldstart = min(oldstart, len(self.lines))

821

oldstart = min(oldstart, len(self.lines))

822

if old:

822

if old:

823

cand = self.findlines(old[0][1:], oldstart)

823

cand = self.findlines(old[0][1:], oldstart)

824

else:

824

else:

825

# Only adding lines with no or fuzzed context, just

825

# Only adding lines with no or fuzzed context, just

826

# take the skew in account

826

# take the skew in account

827

cand = [oldstart]

827

cand = [oldstart]

828

829

for l in cand:

829

for l in cand:

830

if not old or diffhelper.testhunk(old, self.lines, l):

830

if not old or diffhelper.testhunk(old, self.lines, l):

831

self.lines[l : l + len(old)] = new

831

self.lines[l : l + len(old)] = new

832

self.offset += len(new) - len(old)

832

self.offset += len(new) - len(old)

833

self.skew = l - orig_start

833

self.skew = l - orig_start

834

self.dirty = True

834

self.dirty = True

835

offset = l - orig_start - fuzzlen

835

offset = l - orig_start - fuzzlen

836

if fuzzlen:

836

if fuzzlen:

837

msg = _("Hunk #%d succeeded at %d "

837

msg = _("Hunk #%d succeeded at %d "

838

"with fuzz %d "

838

"with fuzz %d "

839

"(offset %d lines).\n")

839

"(offset %d lines).\n")

840

self.printfile(True)

840

self.printfile(True)

841

self.ui.warn(msg %

841

self.ui.warn(msg %

842

(h.number, l + 1, fuzzlen, offset))

842

(h.number, l + 1, fuzzlen, offset))

843

else:

843

else:

844

msg = _("Hunk #%d succeeded at %d "

844

msg = _("Hunk #%d succeeded at %d "

845

"(offset %d lines).\n")

845

"(offset %d lines).\n")

846

self.ui.note(msg % (h.number, l + 1, offset))

846

self.ui.note(msg % (h.number, l + 1, offset))

847

return fuzzlen

847

return fuzzlen

848

self.printfile(True)

848

self.printfile(True)

849

self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))

849

self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))

850

self.rej.append(horig)

850

self.rej.append(horig)

851

return -1

851

return -1

852

853

def close(self):

853

def close(self):

854

if self.dirty:

854

if self.dirty:

855

self.writelines(self.fname, self.lines, self.mode)

855

self.writelines(self.fname, self.lines, self.mode)

856

self.write_rej()

856

self.write_rej()

857

return len(self.rej)

857

return len(self.rej)

858

859

class header(object):

859

class header(object):

860

"""patch header

860

"""patch header

861

"""

861

"""

862

diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')

862

diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')

863

diff_re = re.compile('diff -r .* (.*)$')

863

diff_re = re.compile('diff -r .* (.*)$')

864

allhunks_re = re.compile('(?:index|deleted file) ')

864

allhunks_re = re.compile('(?:index|deleted file) ')

865

pretty_re = re.compile('(?:new file|deleted file) ')

865

pretty_re = re.compile('(?:new file|deleted file) ')

866

special_re = re.compile('(?:index|deleted|copy|rename|new mode) ')

866

special_re = re.compile('(?:index|deleted|copy|rename|new mode) ')

867

newfile_re = re.compile('(?:new file)')

867

newfile_re = re.compile('(?:new file)')

868

869

def __init__(self, header):

869

def __init__(self, header):

870

self.header = header

870

self.header = header

871

self.hunks = []

871

self.hunks = []

872

873

def binary(self):

873

def binary(self):

874

return any(h.startswith('index ') for h in self.header)

874

return any(h.startswith('index ') for h in self.header)

875

876

def pretty(self, fp):

876

def pretty(self, fp):

877

for h in self.header:

877

for h in self.header:

878

if h.startswith('index '):

878

if h.startswith('index '):

879

fp.write(_('this modifies a binary file (all or nothing)\n'))

879

fp.write(_('this modifies a binary file (all or nothing)\n'))

880

break

880

break

881

if self.pretty_re.match(h):

881

if self.pretty_re.match(h):

882

fp.write(h)

882

fp.write(h)

883

if self.binary():

883

if self.binary():

884

fp.write(_('this is a binary file\n'))

884

fp.write(_('this is a binary file\n'))

885

break

885

break

886

if h.startswith('---'):

886

if h.startswith('---'):

887

fp.write(_('%d hunks, %d lines changed\n') %

887

fp.write(_('%d hunks, %d lines changed\n') %

888

(len(self.hunks),

888

(len(self.hunks),

889

sum([max(h.added, h.removed) for h in self.hunks])))

889

sum([max(h.added, h.removed) for h in self.hunks])))

890

break

890

break

891

fp.write(h)

891

fp.write(h)

892

893

def write(self, fp):

893

def write(self, fp):

894

fp.write(''.join(self.header))

894

fp.write(''.join(self.header))

895

896

def allhunks(self):

896

def allhunks(self):

897

return any(self.allhunks_re.match(h) for h in self.header)

897

return any(self.allhunks_re.match(h) for h in self.header)

898

899

def files(self):

899

def files(self):

900

match = self.diffgit_re.match(self.header[0])

900

match = self.diffgit_re.match(self.header[0])

901

if match:

901

if match:

902

fromfile, tofile = match.groups()

902

fromfile, tofile = match.groups()

903

if fromfile == tofile:

903

if fromfile == tofile:

904

return [fromfile]

904

return [fromfile]

905

return [fromfile, tofile]

905

return [fromfile, tofile]

906

else:

906

else:

907

return self.diff_re.match(self.header[0]).groups()

907

return self.diff_re.match(self.header[0]).groups()

908

909

def filename(self):

909

def filename(self):

910

return self.files()[-1]

910

return self.files()[-1]

911

912

def __repr__(self):

912

def __repr__(self):

913

return '<header %s>' % (' '.join(map(repr, self.files())))

913

return '<header %s>' % (' '.join(map(repr, self.files())))

914

915

def isnewfile(self):

915

def isnewfile(self):

916

return any(self.newfile_re.match(h) for h in self.header)

916

return any(self.newfile_re.match(h) for h in self.header)

917

918

def special(self):

918

def special(self):

919

# Special files are shown only at the header level and not at the hunk

919

# Special files are shown only at the header level and not at the hunk

920

# level for example a file that has been deleted is a special file.

920

# level for example a file that has been deleted is a special file.

921

# The user cannot change the content of the operation, in the case of

921

# The user cannot change the content of the operation, in the case of

922

# the deleted file he has to take the deletion or not take it, he

922

# the deleted file he has to take the deletion or not take it, he

923

# cannot take some of it.

923

# cannot take some of it.

924

# Newly added files are special if they are empty, they are not special

924

# Newly added files are special if they are empty, they are not special

925

# if they have some content as we want to be able to change it

925

# if they have some content as we want to be able to change it

926

nocontent = len(self.header) == 2

926

nocontent = len(self.header) == 2

927

emptynewfile = self.isnewfile() and nocontent

927

emptynewfile = self.isnewfile() and nocontent

928

return (emptynewfile

928

return (emptynewfile

929

or any(self.special_re.match(h) for h in self.header))

929

or any(self.special_re.match(h) for h in self.header))

930

931

class recordhunk(object):

931

class recordhunk(object):

932

"""patch hunk

932

"""patch hunk

933

934

XXX shouldn't we merge this with the other hunk class?

934

XXX shouldn't we merge this with the other hunk class?

935

"""

935

"""

936

937

def __init__(self, header, fromline, toline, proc, before, hunk, after,

937

def __init__(self, header, fromline, toline, proc, before, hunk, after,

938

maxcontext=None):

938

maxcontext=None):

939

def trimcontext(lines, reverse=False):

939

def trimcontext(lines, reverse=False):

940

if maxcontext is not None:

940

if maxcontext is not None:

941

delta = len(lines) - maxcontext

941

delta = len(lines) - maxcontext

942

if delta > 0:

942

if delta > 0:

943

if reverse:

943

if reverse:

944

return delta, lines[delta:]

944

return delta, lines[delta:]

945

else:

945

else:

946

return delta, lines[:maxcontext]

946

return delta, lines[:maxcontext]

947

return 0, lines

947

return 0, lines

948

949

self.header = header

949

self.header = header

950

trimedbefore, self.before = trimcontext(before, True)

950

trimedbefore, self.before = trimcontext(before, True)

951

self.fromline = fromline + trimedbefore

951

self.fromline = fromline + trimedbefore

952

self.toline = toline + trimedbefore

952

self.toline = toline + trimedbefore

953

_trimedafter, self.after = trimcontext(after, False)

953

_trimedafter, self.after = trimcontext(after, False)

954

self.proc = proc

954

self.proc = proc

955

self.hunk = hunk

955

self.hunk = hunk

956

self.added, self.removed = self.countchanges(self.hunk)

956

self.added, self.removed = self.countchanges(self.hunk)

957

958

def __eq__(self, v):

958

def __eq__(self, v):

959

if not isinstance(v, recordhunk):

959

if not isinstance(v, recordhunk):

960

return False

960

return False

961

962

return ((v.hunk == self.hunk) and

962

return ((v.hunk == self.hunk) and

963

(v.proc == self.proc) and

963

(v.proc == self.proc) and

964

(self.fromline == v.fromline) and

964

(self.fromline == v.fromline) and

965

(self.header.files() == v.header.files()))

965

(self.header.files() == v.header.files()))

966

967

def __hash__(self):

967

def __hash__(self):

968

return hash((tuple(self.hunk),

968

return hash((tuple(self.hunk),

969

tuple(self.header.files()),

969

tuple(self.header.files()),

970

self.fromline,

970

self.fromline,

971

self.proc))

971

self.proc))

972

973

def countchanges(self, hunk):

973

def countchanges(self, hunk):

974

"""hunk -> (n+,n-)"""

974

"""hunk -> (n+,n-)"""

975

add = len([h for h in hunk if h.startswith('+')])

975

add = len([h for h in hunk if h.startswith('+')])

976

rem = len([h for h in hunk if h.startswith('-')])

976

rem = len([h for h in hunk if h.startswith('-')])

977

return add, rem

977

return add, rem

978

979

def reversehunk(self):

979

def reversehunk(self):

980

"""return another recordhunk which is the reverse of the hunk

980

"""return another recordhunk which is the reverse of the hunk

981

982

If this hunk is diff(A, B), the returned hunk is diff(B, A). To do

982

If this hunk is diff(A, B), the returned hunk is diff(B, A). To do

983

that, swap fromline/toline and +/- signs while keep other things

983

that, swap fromline/toline and +/- signs while keep other things

984

unchanged.

984

unchanged.

985

"""

985

"""

986

m = {'+': '-', '-': '+', '\\': '\\'}

986

m = {'+': '-', '-': '+', '\\': '\\'}

987

hunk = ['%s%s' % (m[l[0:1]], l[1:]) for l in self.hunk]

987

hunk = ['%s%s' % (m[l[0:1]], l[1:]) for l in self.hunk]

988

return recordhunk(self.header, self.toline, self.fromline, self.proc,

988

return recordhunk(self.header, self.toline, self.fromline, self.proc,

989

self.before, hunk, self.after)

989

self.before, hunk, self.after)

990

991

def write(self, fp):

991

def write(self, fp):

992

delta = len(self.before) + len(self.after)

992

delta = len(self.before) + len(self.after)

993

if self.after and self.after[-1] == '\\ No newline at end of file\n':

993

if self.after and self.after[-1] == '\\ No newline at end of file\n':

994

delta -= 1

994

delta -= 1

995

fromlen = delta + self.removed

995

fromlen = delta + self.removed

996

tolen = delta + self.added

996

tolen = delta + self.added

997

fp.write('@@ -%d,%d +%d,%d @@%s\n' %

997

fp.write('@@ -%d,%d +%d,%d @@%s\n' %

998

(self.fromline, fromlen, self.toline, tolen,

998

(self.fromline, fromlen, self.toline, tolen,

999

self.proc and (' ' + self.proc)))

999

self.proc and (' ' + self.proc)))

1000

fp.write(''.join(self.before + self.hunk + self.after))

1000

fp.write(''.join(self.before + self.hunk + self.after))

1001

1002

pretty = write

1002

pretty = write

1003

1004

def filename(self):

1004

def filename(self):

1005

return self.header.filename()

1005

return self.header.filename()

1006

1007

def __repr__(self):

1007

def __repr__(self):

1008

return '<hunk %r@%d>' % (self.filename(), self.fromline)

1008

return '<hunk %r@%d>' % (self.filename(), self.fromline)

1009

1010

def getmessages():

1010

def getmessages():

1011

return {

1011

return {

1012

'multiple': {

1012

'multiple': {

1013

'apply': _("apply change %d/%d to '%s'?"),

1013

'apply': _("apply change %d/%d to '%s'?"),

1014

'discard': _("discard change %d/%d to '%s'?"),

1014

'discard': _("discard change %d/%d to '%s'?"),

1015

'record': _("record change %d/%d to '%s'?"),

1015

'record': _("record change %d/%d to '%s'?"),

1016

},

1016

},

1017

'single': {

1017

'single': {

1018

'apply': _("apply this change to '%s'?"),

1018

'apply': _("apply this change to '%s'?"),

1019

'discard': _("discard this change to '%s'?"),

1019

'discard': _("discard this change to '%s'?"),

1020

'record': _("record this change to '%s'?"),

1020

'record': _("record this change to '%s'?"),

1021

},

1021

},

1022

'help': {

1022

'help': {

1023

'apply': _('[Ynesfdaq?]'

1023

'apply': _('[Ynesfdaq?]'

1024

'$$ &Yes, apply this change'

1024

'$$ &Yes, apply this change'

1025

'$$ &No, skip this change'

1025

'$$ &No, skip this change'

1026

'$$ &Edit this change manually'

1026

'$$ &Edit this change manually'

1027

'$$ &Skip remaining changes to this file'

1027

'$$ &Skip remaining changes to this file'

1028

'$$ Apply remaining changes to this &file'

1028

'$$ Apply remaining changes to this &file'

1029

'$$ &Done, skip remaining changes and files'

1029

'$$ &Done, skip remaining changes and files'

1030

'$$ Apply &all changes to all remaining files'

1030

'$$ Apply &all changes to all remaining files'

1031

'$$ &Quit, applying no changes'

1031

'$$ &Quit, applying no changes'

1032

'$$ &? (display help)'),

1032

'$$ &? (display help)'),

1033

'discard': _('[Ynesfdaq?]'

1033

'discard': _('[Ynesfdaq?]'

1034

'$$ &Yes, discard this change'

1034

'$$ &Yes, discard this change'

1035

'$$ &No, skip this change'

1035

'$$ &No, skip this change'

1036

'$$ &Edit this change manually'

1036

'$$ &Edit this change manually'

1037

'$$ &Skip remaining changes to this file'

1037

'$$ &Skip remaining changes to this file'

1038

'$$ Discard remaining changes to this &file'

1038

'$$ Discard remaining changes to this &file'

1039

'$$ &Done, skip remaining changes and files'

1039

'$$ &Done, skip remaining changes and files'

1040

'$$ Discard &all changes to all remaining files'

1040

'$$ Discard &all changes to all remaining files'

1041

'$$ &Quit, discarding no changes'

1041

'$$ &Quit, discarding no changes'

1042

'$$ &? (display help)'),

1042

'$$ &? (display help)'),

1043

'record': _('[Ynesfdaq?]'

1043

'record': _('[Ynesfdaq?]'

1044

'$$ &Yes, record this change'

1044

'$$ &Yes, record this change'

1045

'$$ &No, skip this change'

1045

'$$ &No, skip this change'

1046

'$$ &Edit this change manually'

1046

'$$ &Edit this change manually'

1047

'$$ &Skip remaining changes to this file'

1047

'$$ &Skip remaining changes to this file'

1048

'$$ Record remaining changes to this &file'

1048

'$$ Record remaining changes to this &file'

1049

'$$ &Done, skip remaining changes and files'

1049

'$$ &Done, skip remaining changes and files'

1050

'$$ Record &all changes to all remaining files'

1050

'$$ Record &all changes to all remaining files'

1051

'$$ &Quit, recording no changes'

1051

'$$ &Quit, recording no changes'

1052

'$$ &? (display help)'),

1052

'$$ &? (display help)'),

1053

}

1053

}

1054

}

1054

}

1055

1056

def filterpatch(ui, headers, operation=None):

1056

def filterpatch(ui, headers, operation=None):

1057

"""Interactively filter patch chunks into applied-only chunks"""

1057

"""Interactively filter patch chunks into applied-only chunks"""

1058

messages = getmessages()

1058

messages = getmessages()

1059

1060

if operation is None:

1060

if operation is None:

1061

operation = 'record'

1061

operation = 'record'

1062

1063

def prompt(skipfile, skipall, query, chunk):

1063

def prompt(skipfile, skipall, query, chunk):

1064

"""prompt query, and process base inputs

1064

"""prompt query, and process base inputs

1065

1066

- y/n for the rest of file

1066

- y/n for the rest of file

1067

- y/n for the rest

1067

- y/n for the rest

1068

- ? (help)

1068

- ? (help)

1069

- q (quit)

1069

- q (quit)

1070

1071

Return True/False and possibly updated skipfile and skipall.

1071

Return True/False and possibly updated skipfile and skipall.

1072

"""

1072

"""

1073

newpatches = None

1073

newpatches = None

1074

if skipall is not None:

1074

if skipall is not None:

1075

return skipall, skipfile, skipall, newpatches

1075

return skipall, skipfile, skipall, newpatches

1076

if skipfile is not None:

1076

if skipfile is not None:

1077

return skipfile, skipfile, skipall, newpatches

1077

return skipfile, skipfile, skipall, newpatches

1078

while True:

1078

while True:

1079

resps = messages['help'][operation]

1079

resps = messages['help'][operation]

1080

r = ui.promptchoice("%s %s" % (query, resps))

1080

r = ui.promptchoice("%s %s" % (query, resps))

1081

ui.write("\n")

1081

ui.write("\n")

1082

if r == 8: # ?

1082

if r == 8: # ?

1083

for c, t in ui.extractchoices(resps)[1]:

1083

for c, t in ui.extractchoices(resps)[1]:

1084

ui.write('%s - %s\n' % (c, encoding.lower(t)))

1084

ui.write('%s - %s\n' % (c, encoding.lower(t)))

1085

continue

1085

continue

1086

elif r == 0: # yes

1086

elif r == 0: # yes

1087

ret = True

1087

ret = True

1088

elif r == 1: # no

1088

elif r == 1: # no

1089

ret = False

1089

ret = False

1090

elif r == 2: # Edit patch

1090

elif r == 2: # Edit patch

1091

if chunk is None:

1091

if chunk is None:

1092

ui.write(_('cannot edit patch for whole file'))

1092

ui.write(_('cannot edit patch for whole file'))

1093

ui.write("\n")

1093

ui.write("\n")

1094

continue

1094

continue

1095

if chunk.header.binary():

1095

if chunk.header.binary():

1096

ui.write(_('cannot edit patch for binary file'))

1096

ui.write(_('cannot edit patch for binary file'))

1097

ui.write("\n")

1097

ui.write("\n")

1098

continue

1098

continue

1099

# Patch comment based on the Git one (based on comment at end of

1099

# Patch comment based on the Git one (based on comment at end of

1100

# https://mercurial-scm.org/wiki/RecordExtension)

1100

# https://mercurial-scm.org/wiki/RecordExtension)

1101

phelp = '---' + _("""

1101

phelp = '---' + _("""

1102

To remove '-' lines, make them ' ' lines (context).

1102

To remove '-' lines, make them ' ' lines (context).

1103

To remove '+' lines, delete them.

1103

To remove '+' lines, delete them.

1104

Lines starting with # will be removed from the patch.

1104

Lines starting with # will be removed from the patch.

1105

1106

If the patch applies cleanly, the edited hunk will immediately be

1106

If the patch applies cleanly, the edited hunk will immediately be

1107

added to the record list. If it does not apply cleanly, a rejects

1107

added to the record list. If it does not apply cleanly, a rejects

1108

file will be generated: you can use that when you try again. If

1108

file will be generated: you can use that when you try again. If

1109

all lines of the hunk are removed, then the edit is aborted and

1109

all lines of the hunk are removed, then the edit is aborted and

1110

the hunk is left unchanged.

1110

the hunk is left unchanged.

1111

""")

1111

""")

1112

(patchfd, patchfn) = pycompat.mkstemp(prefix="hg-editor-",

1112

(patchfd, patchfn) = pycompat.mkstemp(prefix="hg-editor-",

1113

suffix=".diff")

1113

suffix=".diff")

1114

ncpatchfp = None

1114

ncpatchfp = None

1115

try:

1115

try:

1116

# Write the initial patch

1116

# Write the initial patch

1117

f = util.nativeeolwriter(os.fdopen(patchfd, r'wb'))

1117

f = util.nativeeolwriter(os.fdopen(patchfd, r'wb'))

1118

chunk.header.write(f)

1118

chunk.header.write(f)

1119

chunk.write(f)

1119

chunk.write(f)

1120

f.write('\n'.join(['# ' + i ~~for~~ i in ~~phelp~~.~~splitlines()]))~~

1120

f.write(''.join(['# ' + i + '\n'

1121

for i in phelp.splitlines()]))

1121

f.close()

1122

f.close()

1122

# Start the editor and wait for it to complete

1123

# Start the editor and wait for it to complete

1123

editor = ui.geteditor()

1124

editor = ui.geteditor()

1124

ret = ui.system("%s \"%s\"" % (editor, patchfn),

1125

ret = ui.system("%s \"%s\"" % (editor, patchfn),

1125

environ={'HGUSER': ui.username()},

1126

environ={'HGUSER': ui.username()},

1126

blockedtag='filterpatch')

1127

blockedtag='filterpatch')

1127

if ret != 0:

1128

if ret != 0:

1128

ui.warn(_("editor exited with exit code %d\n") % ret)

1129

ui.warn(_("editor exited with exit code %d\n") % ret)

1129

continue

1130

continue

1130

# Remove comment lines

1131

# Remove comment lines

1131

patchfp = open(patchfn, r'rb')

1132

patchfp = open(patchfn, r'rb')

1132

ncpatchfp = stringio()

1133

ncpatchfp = stringio()

1133

for line in util.iterfile(patchfp):

1134

for line in util.iterfile(patchfp):

1134

line = util.fromnativeeol(line)

1135

line = util.fromnativeeol(line)

1135

if not line.startswith('#'):

1136

if not line.startswith('#'):

1136

ncpatchfp.write(line)

1137

ncpatchfp.write(line)

1137

patchfp.close()

1138

patchfp.close()

1138

ncpatchfp.seek(0)

1139

ncpatchfp.seek(0)

1139

newpatches = parsepatch(ncpatchfp)

1140

newpatches = parsepatch(ncpatchfp)

1140

finally:

1141

finally:

1141

os.unlink(patchfn)

1142

os.unlink(patchfn)

1142

del ncpatchfp

1143

del ncpatchfp

1143

# Signal that the chunk shouldn't be applied as-is, but

1144

# Signal that the chunk shouldn't be applied as-is, but

1144

# provide the new patch to be used instead.

1145

# provide the new patch to be used instead.

1145

ret = False

1146

ret = False

1146

elif r == 3: # Skip

1147

elif r == 3: # Skip

1147

ret = skipfile = False

1148

ret = skipfile = False

1148

elif r == 4: # file (Record remaining)

1149

elif r == 4: # file (Record remaining)

1149

ret = skipfile = True

1150

ret = skipfile = True

1150

elif r == 5: # done, skip remaining

1151

elif r == 5: # done, skip remaining

1151

ret = skipall = False

1152

ret = skipall = False

1152

elif r == 6: # all

1153

elif r == 6: # all

1153

ret = skipall = True

1154

ret = skipall = True

1154

elif r == 7: # quit

1155

elif r == 7: # quit

1155

raise error.Abort(_('user quit'))

1156

raise error.Abort(_('user quit'))

1156

return ret, skipfile, skipall, newpatches

1157

return ret, skipfile, skipall, newpatches

1157

1158

seen = set()

1159

seen = set()

1159

applied = {} # 'filename' -> [] of chunks

1160

applied = {} # 'filename' -> [] of chunks

1160

skipfile, skipall = None, None

1161

skipfile, skipall = None, None

1161

pos, total = 1, sum(len(h.hunks) for h in headers)

1162

pos, total = 1, sum(len(h.hunks) for h in headers)

1162

for h in headers:

1163

for h in headers:

1163

pos += len(h.hunks)

1164

pos += len(h.hunks)

1164

skipfile = None

1165

skipfile = None

1165

fixoffset = 0

1166

fixoffset = 0

1166

hdr = ''.join(h.header)

1167

hdr = ''.join(h.header)

1167

if hdr in seen:

1168

if hdr in seen:

1168

continue

1169

continue

1169

seen.add(hdr)

1170

seen.add(hdr)

1170

if skipall is None:

1171

if skipall is None:

1171

h.pretty(ui)

1172

h.pretty(ui)

1172

msg = (_('examine changes to %s?') %

1173

msg = (_('examine changes to %s?') %

1173

_(' and ').join("'%s'" % f for f in h.files()))

1174

_(' and ').join("'%s'" % f for f in h.files()))

1174

r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)

1175

r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)

1175

if not r:

1176

if not r:

1176

continue

1177

continue

1177

applied[h.filename()] = [h]

1178

applied[h.filename()] = [h]

1178

if h.allhunks():

1179

if h.allhunks():

1179

applied[h.filename()] += h.hunks

1180

applied[h.filename()] += h.hunks

1180

continue

1181

continue

1181

for i, chunk in enumerate(h.hunks):

1182

for i, chunk in enumerate(h.hunks):

1182

if skipfile is None and skipall is None:

1183

if skipfile is None and skipall is None:

1183

chunk.pretty(ui)

1184

chunk.pretty(ui)

1184

if total == 1:

1185

if total == 1:

1185

msg = messages['single'][operation] % chunk.filename()

1186

msg = messages['single'][operation] % chunk.filename()

1186

else:

1187

else:

1187

idx = pos - len(h.hunks) + i

1188

idx = pos - len(h.hunks) + i

1188

msg = messages['multiple'][operation] % (idx, total,

1189

msg = messages['multiple'][operation] % (idx, total,

1189

chunk.filename())

1190

chunk.filename())

1190

r, skipfile, skipall, newpatches = prompt(skipfile,

1191

r, skipfile, skipall, newpatches = prompt(skipfile,

1191

skipall, msg, chunk)

1192

skipall, msg, chunk)

1192

if r:

1193

if r:

1193

if fixoffset:

1194

if fixoffset:

1194

chunk = copy.copy(chunk)

1195

chunk = copy.copy(chunk)

1195

chunk.toline += fixoffset

1196

chunk.toline += fixoffset

1196

applied[chunk.filename()].append(chunk)

1197

applied[chunk.filename()].append(chunk)

1197

elif newpatches is not None:

1198

elif newpatches is not None:

1198

for newpatch in newpatches:

1199

for newpatch in newpatches:

1199

for newhunk in newpatch.hunks:

1200

for newhunk in newpatch.hunks:

1200

if fixoffset:

1201

if fixoffset:

1201

newhunk.toline += fixoffset

1202

newhunk.toline += fixoffset

1202

applied[newhunk.filename()].append(newhunk)

1203

applied[newhunk.filename()].append(newhunk)

1203

else:

1204

else:

1204

fixoffset += chunk.removed - chunk.added

1205

fixoffset += chunk.removed - chunk.added

1205

return (sum([h for h in applied.itervalues()

1206

return (sum([h for h in applied.itervalues()

1206

if h[0].special() or len(h) > 1], []), {})

1207

if h[0].special() or len(h) > 1], []), {})

1207

class hunk(object):

1208

class hunk(object):

1208

def __init__(self, desc, num, lr, context):

1209

def __init__(self, desc, num, lr, context):

1209

self.number = num

1210

self.number = num

1210

self.desc = desc

1211

self.desc = desc

1211

self.hunk = [desc]

1212

self.hunk = [desc]

1212

self.a = []

1213

self.a = []

1213

self.b = []

1214

self.b = []

1214

self.starta = self.lena = None

1215

self.starta = self.lena = None

1215

self.startb = self.lenb = None

1216

self.startb = self.lenb = None

1216

if lr is not None:

1217

if lr is not None:

1217

if context:

1218

if context:

1218

self.read_context_hunk(lr)

1219

self.read_context_hunk(lr)

1219

else:

1220

else:

1220

self.read_unified_hunk(lr)

1221

self.read_unified_hunk(lr)

1221

1222

def getnormalized(self):

1223

def getnormalized(self):

1223

"""Return a copy with line endings normalized to LF."""

1224

"""Return a copy with line endings normalized to LF."""

1224

1225

def normalize(lines):

1226

def normalize(lines):

1226

nlines = []

1227

nlines = []

1227

for line in lines:

1228

for line in lines:

1228

if line.endswith('\r\n'):

1229

if line.endswith('\r\n'):

1229

line = line[:-2] + '\n'

1230

line = line[:-2] + '\n'

1230

nlines.append(line)

1231

nlines.append(line)

1231

return nlines

1232

return nlines

1232

1233

# Dummy object, it is rebuilt manually

1234

# Dummy object, it is rebuilt manually

1234

nh = hunk(self.desc, self.number, None, None)

1235

nh = hunk(self.desc, self.number, None, None)

1235

nh.number = self.number

1236

nh.number = self.number

1236

nh.desc = self.desc

1237

nh.desc = self.desc

1237

nh.hunk = self.hunk

1238

nh.hunk = self.hunk

1238

nh.a = normalize(self.a)

1239

nh.a = normalize(self.a)

1239

nh.b = normalize(self.b)

1240

nh.b = normalize(self.b)

1240

nh.starta = self.starta

1241

nh.starta = self.starta

1241

nh.startb = self.startb

1242

nh.startb = self.startb

1242

nh.lena = self.lena

1243

nh.lena = self.lena

1243

nh.lenb = self.lenb

1244

nh.lenb = self.lenb

1244

return nh

1245

return nh

1245

1246

def read_unified_hunk(self, lr):

1247

def read_unified_hunk(self, lr):

1247

m = unidesc.match(self.desc)

1248

m = unidesc.match(self.desc)

1248

if not m:

1249

if not m:

1249

raise PatchError(_("bad hunk #%d") % self.number)

1250

raise PatchError(_("bad hunk #%d") % self.number)

1250

self.starta, self.lena, self.startb, self.lenb = m.groups()

1251

self.starta, self.lena, self.startb, self.lenb = m.groups()

1251

if self.lena is None:

1252

if self.lena is None:

1252

self.lena = 1

1253

self.lena = 1

1253

else:

1254

else:

1254

self.lena = int(self.lena)

1255

self.lena = int(self.lena)

1255

if self.lenb is None:

1256

if self.lenb is None:

1256

self.lenb = 1

1257

self.lenb = 1

1257

else:

1258

else:

1258

self.lenb = int(self.lenb)

1259

self.lenb = int(self.lenb)

1259

self.starta = int(self.starta)

1260

self.starta = int(self.starta)

1260

self.startb = int(self.startb)

1261

self.startb = int(self.startb)

1261

try:

1262

try:

1262

diffhelper.addlines(lr, self.hunk, self.lena, self.lenb,

1263

diffhelper.addlines(lr, self.hunk, self.lena, self.lenb,

1263

self.a, self.b)

1264

self.a, self.b)

1264

except error.ParseError as e:

1265

except error.ParseError as e:

1265

raise PatchError(_("bad hunk #%d: %s") % (self.number, e))

1266

raise PatchError(_("bad hunk #%d: %s") % (self.number, e))

1266

# if we hit eof before finishing out the hunk, the last line will

1267

# if we hit eof before finishing out the hunk, the last line will

1267

# be zero length. Lets try to fix it up.

1268

# be zero length. Lets try to fix it up.

1268

while len(self.hunk[-1]) == 0:

1269

while len(self.hunk[-1]) == 0:

1269

del self.hunk[-1]

1270

del self.hunk[-1]

1270

del self.a[-1]

1271

del self.a[-1]

1271

del self.b[-1]

1272

del self.b[-1]

1272

self.lena -= 1

1273

self.lena -= 1

1273

self.lenb -= 1

1274

self.lenb -= 1

1274

self._fixnewline(lr)

1275

self._fixnewline(lr)

1275

1276

def read_context_hunk(self, lr):

1277

def read_context_hunk(self, lr):

1277

self.desc = lr.readline()

1278

self.desc = lr.readline()

1278

m = contextdesc.match(self.desc)

1279

m = contextdesc.match(self.desc)

1279

if not m:

1280

if not m:

1280

raise PatchError(_("bad hunk #%d") % self.number)

1281

raise PatchError(_("bad hunk #%d") % self.number)

1281

self.starta, aend = m.groups()

1282

self.starta, aend = m.groups()

1282

self.starta = int(self.starta)

1283

self.starta = int(self.starta)

1283

if aend is None:

1284

if aend is None:

1284

aend = self.starta

1285

aend = self.starta

1285

self.lena = int(aend) - self.starta

1286

self.lena = int(aend) - self.starta

1286

if self.starta:

1287

if self.starta:

1287

self.lena += 1

1288

self.lena += 1

1288

for x in pycompat.xrange(self.lena):

1289

for x in pycompat.xrange(self.lena):

1289

l = lr.readline()

1290

l = lr.readline()

1290

if l.startswith('---'):

1291

if l.startswith('---'):

1291

# lines addition, old block is empty

1292

# lines addition, old block is empty

1292

lr.push(l)

1293

lr.push(l)

1293

break

1294

break

1294

s = l[2:]

1295

s = l[2:]

1295

if l.startswith('- ') or l.startswith('! '):

1296

if l.startswith('- ') or l.startswith('! '):

1296

u = '-' + s

1297

u = '-' + s

1297

elif l.startswith(' '):

1298

elif l.startswith(' '):

1298

u = ' ' + s

1299

u = ' ' + s

1299

else:

1300

else:

1300

raise PatchError(_("bad hunk #%d old text line %d") %

1301

raise PatchError(_("bad hunk #%d old text line %d") %

1301

(self.number, x))

1302

(self.number, x))

1302

self.a.append(u)

1303

self.a.append(u)

1303

self.hunk.append(u)

1304

self.hunk.append(u)

1304

1305

l = lr.readline()

1306

l = lr.readline()

1306

if l.startswith(br'\ '):

1307

if l.startswith(br'\ '):

1307

s = self.a[-1][:-1]

1308

s = self.a[-1][:-1]

1308

self.a[-1] = s

1309

self.a[-1] = s

1309

self.hunk[-1] = s

1310

self.hunk[-1] = s

1310

l = lr.readline()

1311

l = lr.readline()

1311

m = contextdesc.match(l)

1312

m = contextdesc.match(l)

1312

if not m:

1313

if not m:

1313

raise PatchError(_("bad hunk #%d") % self.number)

1314

raise PatchError(_("bad hunk #%d") % self.number)

1314

self.startb, bend = m.groups()

1315

self.startb, bend = m.groups()

1315

self.startb = int(self.startb)

1316

self.startb = int(self.startb)

1316

if bend is None:

1317

if bend is None:

1317

bend = self.startb

1318

bend = self.startb

1318

self.lenb = int(bend) - self.startb

1319

self.lenb = int(bend) - self.startb

1319

if self.startb:

1320

if self.startb:

1320

self.lenb += 1

1321

self.lenb += 1

1321

hunki = 1

1322

hunki = 1

1322

for x in pycompat.xrange(self.lenb):

1323

for x in pycompat.xrange(self.lenb):

1323

l = lr.readline()

1324

l = lr.readline()

1324

if l.startswith(br'\ '):

1325

if l.startswith(br'\ '):

1325

# XXX: the only way to hit this is with an invalid line range.

1326

# XXX: the only way to hit this is with an invalid line range.

1326

# The no-eol marker is not counted in the line range, but I

1327

# The no-eol marker is not counted in the line range, but I

1327

# guess there are diff(1) out there which behave differently.

1328

# guess there are diff(1) out there which behave differently.

1328

s = self.b[-1][:-1]

1329

s = self.b[-1][:-1]

1329

self.b[-1] = s

1330

self.b[-1] = s

1330

self.hunk[hunki - 1] = s

1331

self.hunk[hunki - 1] = s

1331

continue

1332

continue

1332

if not l:

1333

if not l:

1333

# line deletions, new block is empty and we hit EOF

1334

# line deletions, new block is empty and we hit EOF

1334

lr.push(l)

1335

lr.push(l)

1335

break

1336

break

1336

s = l[2:]

1337

s = l[2:]

1337

if l.startswith('+ ') or l.startswith('! '):

1338

if l.startswith('+ ') or l.startswith('! '):

1338

u = '+' + s

1339

u = '+' + s

1339

elif l.startswith(' '):

1340

elif l.startswith(' '):

1340

u = ' ' + s

1341

u = ' ' + s

1341

elif len(self.b) == 0:

1342

elif len(self.b) == 0:

1342

# line deletions, new block is empty

1343

# line deletions, new block is empty

1343

lr.push(l)

1344

lr.push(l)

1344

break

1345

break

1345

else:

1346

else:

1346

raise PatchError(_("bad hunk #%d old text line %d") %

1347

raise PatchError(_("bad hunk #%d old text line %d") %

1347

(self.number, x))

1348

(self.number, x))

1348

self.b.append(s)

1349

self.b.append(s)

1349

while True:

1350

while True:

1350

if hunki >= len(self.hunk):

1351

if hunki >= len(self.hunk):

1351

h = ""

1352

h = ""

1352

else:

1353

else:

1353

h = self.hunk[hunki]

1354

h = self.hunk[hunki]

1354

hunki += 1

1355

hunki += 1

1355

if h == u:

1356

if h == u:

1356

break

1357

break

1357

elif h.startswith('-'):

1358

elif h.startswith('-'):

1358

continue

1359

continue

1359

else:

1360

else:

1360

self.hunk.insert(hunki - 1, u)

1361

self.hunk.insert(hunki - 1, u)

1361

break

1362

break

1362

1363

if not self.a:

1364

if not self.a:

1364

# this happens when lines were only added to the hunk

1365

# this happens when lines were only added to the hunk

1365

for x in self.hunk:

1366

for x in self.hunk:

1366

if x.startswith('-') or x.startswith(' '):

1367

if x.startswith('-') or x.startswith(' '):

1367

self.a.append(x)

1368

self.a.append(x)

1368

if not self.b:

1369

if not self.b:

1369

# this happens when lines were only deleted from the hunk

1370

# this happens when lines were only deleted from the hunk

1370

for x in self.hunk:

1371

for x in self.hunk:

1371

if x.startswith('+') or x.startswith(' '):

1372

if x.startswith('+') or x.startswith(' '):

1372

self.b.append(x[1:])

1373

self.b.append(x[1:])

1373

# @@ -start,len +start,len @@

1374

# @@ -start,len +start,len @@

1374

self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,

1375

self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,

1375

self.startb, self.lenb)

1376

self.startb, self.lenb)

1376

self.hunk[0] = self.desc

1377

self.hunk[0] = self.desc

1377

self._fixnewline(lr)

1378

self._fixnewline(lr)

1378

1379

def _fixnewline(self, lr):

1380

def _fixnewline(self, lr):

1380

l = lr.readline()

1381

l = lr.readline()

1381

if l.startswith(br'\ '):

1382

if l.startswith(br'\ '):

1382

diffhelper.fixnewline(self.hunk, self.a, self.b)

1383

diffhelper.fixnewline(self.hunk, self.a, self.b)

1383

else:

1384

else:

1384

lr.push(l)

1385

lr.push(l)

1385

1386

def complete(self):

1387

def complete(self):

1387

return len(self.a) == self.lena and len(self.b) == self.lenb

1388

return len(self.a) == self.lena and len(self.b) == self.lenb

1388

1389

def _fuzzit(self, old, new, fuzz, toponly):

1390

def _fuzzit(self, old, new, fuzz, toponly):

1390

# this removes context lines from the top and bottom of list 'l'. It

1391

# this removes context lines from the top and bottom of list 'l'. It

1391

# checks the hunk to make sure only context lines are removed, and then

1392

# checks the hunk to make sure only context lines are removed, and then

1392

# returns a new shortened list of lines.

1393

# returns a new shortened list of lines.

1393

fuzz = min(fuzz, len(old))

1394

fuzz = min(fuzz, len(old))

1394

if fuzz:

1395

if fuzz:

1395

top = 0

1396

top = 0

1396

bot = 0

1397

bot = 0

1397

hlen = len(self.hunk)

1398

hlen = len(self.hunk)

1398

for x in pycompat.xrange(hlen - 1):

1399

for x in pycompat.xrange(hlen - 1):

1399

# the hunk starts with the @@ line, so use x+1

1400

# the hunk starts with the @@ line, so use x+1

1400

if self.hunk[x + 1].startswith(' '):

1401

if self.hunk[x + 1].startswith(' '):

1401

top += 1

1402

top += 1

1402

else:

1403

else:

1403

break

1404

break

1404

if not toponly:

1405

if not toponly:

1405

for x in pycompat.xrange(hlen - 1):

1406

for x in pycompat.xrange(hlen - 1):

1406

if self.hunk[hlen - bot - 1].startswith(' '):

1407

if self.hunk[hlen - bot - 1].startswith(' '):

1407

bot += 1

1408

bot += 1

1408

else:

1409

else:

1409

break

1410

break

1410

1411

bot = min(fuzz, bot)

1412

bot = min(fuzz, bot)

1412

top = min(fuzz, top)

1413

top = min(fuzz, top)

1413

return old[top:len(old) - bot], new[top:len(new) - bot], top

1414

return old[top:len(old) - bot], new[top:len(new) - bot], top

1414

return old, new, 0

1415

return old, new, 0

1415

1416

def fuzzit(self, fuzz, toponly):

1417

def fuzzit(self, fuzz, toponly):

1417

old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)

1418

old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)

1418

oldstart = self.starta + top

1419

oldstart = self.starta + top

1419

newstart = self.startb + top

1420

newstart = self.startb + top

1420

# zero length hunk ranges already have their start decremented

1421

# zero length hunk ranges already have their start decremented

1421

if self.lena and oldstart > 0:

1422

if self.lena and oldstart > 0:

1422

oldstart -= 1

1423

oldstart -= 1

1423

if self.lenb and newstart > 0:

1424

if self.lenb and newstart > 0:

1424

newstart -= 1

1425

newstart -= 1

1425

return old, oldstart, new, newstart

1426

return old, oldstart, new, newstart

1426

1427

class binhunk(object):

1428

class binhunk(object):

1428

'A binary patch file.'

1429

'A binary patch file.'

1429

def __init__(self, lr, fname):

1430

def __init__(self, lr, fname):

1430

self.text = None

1431

self.text = None

1431

self.delta = False

1432

self.delta = False

1432

self.hunk = ['GIT binary patch\n']

1433

self.hunk = ['GIT binary patch\n']

1433

self._fname = fname

1434

self._fname = fname

1434

self._read(lr)

1435

self._read(lr)

1435

1436

def complete(self):

1437

def complete(self):

1437

return self.text is not None

1438

return self.text is not None

1438

1439

def new(self, lines):

1440

def new(self, lines):

1440

if self.delta:

1441

if self.delta:

1441

return [applybindelta(self.text, ''.join(lines))]

1442

return [applybindelta(self.text, ''.join(lines))]

1442

return [self.text]

1443

return [self.text]

1443

1444

def _read(self, lr):

1445

def _read(self, lr):

1445

def getline(lr, hunk):

1446

def getline(lr, hunk):

1446

l = lr.readline()

1447

l = lr.readline()

1447

hunk.append(l)

1448

hunk.append(l)

1448

return l.rstrip('\r\n')

1449

return l.rstrip('\r\n')

1449

1450

while True:

1451

while True:

1451

line = getline(lr, self.hunk)

1452

line = getline(lr, self.hunk)

1452

if not line:

1453

if not line:

1453

raise PatchError(_('could not extract "%s" binary data')

1454

raise PatchError(_('could not extract "%s" binary data')

1454

% self._fname)

1455

% self._fname)

1455

if line.startswith('literal '):

1456

if line.startswith('literal '):

1456

size = int(line[8:].rstrip())

1457

size = int(line[8:].rstrip())

1457

break

1458

break

1458

if line.startswith('delta '):

1459

if line.startswith('delta '):

1459

size = int(line[6:].rstrip())

1460

size = int(line[6:].rstrip())

1460

self.delta = True

1461

self.delta = True

1461

break

1462

break

1462

dec = []

1463

dec = []

1463

line = getline(lr, self.hunk)

1464

line = getline(lr, self.hunk)

1464

while len(line) > 1:

1465

while len(line) > 1:

1465

l = line[0:1]

1466

l = line[0:1]

1466

if l <= 'Z' and l >= 'A':

1467

if l <= 'Z' and l >= 'A':

1467

l = ord(l) - ord('A') + 1

1468

l = ord(l) - ord('A') + 1

1468

else:

1469

else:

1469

l = ord(l) - ord('a') + 27

1470

l = ord(l) - ord('a') + 27

1470

try:

1471

try:

1471

dec.append(util.b85decode(line[1:])[:l])

1472

dec.append(util.b85decode(line[1:])[:l])

1472

except ValueError as e:

1473

except ValueError as e:

1473

raise PatchError(_('could not decode "%s" binary patch: %s')

1474

raise PatchError(_('could not decode "%s" binary patch: %s')

1474

% (self._fname, stringutil.forcebytestr(e)))

1475

% (self._fname, stringutil.forcebytestr(e)))

1475

line = getline(lr, self.hunk)

1476

line = getline(lr, self.hunk)

1476

text = zlib.decompress(''.join(dec))

1477

text = zlib.decompress(''.join(dec))

1477

if len(text) != size:

1478

if len(text) != size:

1478

raise PatchError(_('"%s" length is %d bytes, should be %d')

1479

raise PatchError(_('"%s" length is %d bytes, should be %d')

1479

% (self._fname, len(text), size))

1480

% (self._fname, len(text), size))

1480

self.text = text

1481

self.text = text

1481

1482

def parsefilename(str):

1483

def parsefilename(str):

1483

# --- filename \t|space stuff

1484

# --- filename \t|space stuff

1484

s = str[4:].rstrip('\r\n')

1485

s = str[4:].rstrip('\r\n')

1485

i = s.find('\t')

1486

i = s.find('\t')

1486

if i < 0:

1487

if i < 0:

1487

i = s.find(' ')

1488

i = s.find(' ')

1488

if i < 0:

1489

if i < 0:

1489

return s

1490

return s

1490

return s[:i]

1491

return s[:i]

1491

1492

def reversehunks(hunks):

1493

def reversehunks(hunks):

1493

'''reverse the signs in the hunks given as argument

1494

'''reverse the signs in the hunks given as argument

1494

1495

This function operates on hunks coming out of patch.filterpatch, that is

1496

This function operates on hunks coming out of patch.filterpatch, that is

1496

a list of the form: [header1, hunk1, hunk2, header2...]. Example usage:

1497

a list of the form: [header1, hunk1, hunk2, header2...]. Example usage:

1497

1498

>>> rawpatch = b"""diff --git a/folder1/g b/folder1/g

1499

>>> rawpatch = b"""diff --git a/folder1/g b/folder1/g

1499

... --- a/folder1/g

1500

... --- a/folder1/g

1500

... +++ b/folder1/g

1501

... +++ b/folder1/g

1501

... @@ -1,7 +1,7 @@

1502

... @@ -1,7 +1,7 @@

1502

... +firstline

1503

... +firstline

1503

... c

1504

... c

1504

... 1

1505

... 1

1505

... 2

1506

... 2

1506

... + 3

1507

... + 3

1507

... -4

1508

... -4

1508

... 5

1509

... 5

1509

... d

1510

... d

1510

... +lastline"""

1511

... +lastline"""

1511

>>> hunks = parsepatch([rawpatch])

1512

>>> hunks = parsepatch([rawpatch])

1512

>>> hunkscomingfromfilterpatch = []

1513

>>> hunkscomingfromfilterpatch = []

1513

>>> for h in hunks:

1514

>>> for h in hunks:

1514

... hunkscomingfromfilterpatch.append(h)

1515

... hunkscomingfromfilterpatch.append(h)

1515

... hunkscomingfromfilterpatch.extend(h.hunks)

1516

... hunkscomingfromfilterpatch.extend(h.hunks)

1516

1517

>>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)

1518

>>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)

1518

>>> from . import util

1519

>>> from . import util

1519

>>> fp = util.stringio()

1520

>>> fp = util.stringio()

1520

>>> for c in reversedhunks:

1521

>>> for c in reversedhunks:

1521

... c.write(fp)

1522

... c.write(fp)

1522

>>> fp.seek(0) or None

1523

>>> fp.seek(0) or None

1523

>>> reversedpatch = fp.read()

1524

>>> reversedpatch = fp.read()

1524

>>> print(pycompat.sysstr(reversedpatch))

1525

>>> print(pycompat.sysstr(reversedpatch))

1525

diff --git a/folder1/g b/folder1/g

1526

diff --git a/folder1/g b/folder1/g

1526

--- a/folder1/g

1527

--- a/folder1/g

1527

+++ b/folder1/g

1528

+++ b/folder1/g

1528

@@ -1,4 +1,3 @@

1529

@@ -1,4 +1,3 @@

1529

-firstline

1530

-firstline

1530

c

1531

c

1531

1

1532

1

1532

2

1533

2

1533

@@ -2,6 +1,6 @@

1534

@@ -2,6 +1,6 @@

1534

c

1535

c

1535

1

1536

1

1536

2

1537

2

1537

- 3

1538

- 3

1538

+4

1539

+4

1539

5

1540

5

1540

d

1541

d

1541

@@ -6,3 +5,2 @@

1542

@@ -6,3 +5,2 @@

1542

5

1543

5

1543

d

1544

d

1544

-lastline

1545

-lastline

1545

1546

'''

1547

'''

1547

1548

newhunks = []

1549

newhunks = []

1549

for c in hunks:

1550

for c in hunks:

1550

if util.safehasattr(c, 'reversehunk'):

1551

if util.safehasattr(c, 'reversehunk'):

1551

c = c.reversehunk()

1552

c = c.reversehunk()

1552

newhunks.append(c)

1553

newhunks.append(c)

1553

return newhunks

1554

return newhunks

1554

1555

def parsepatch(originalchunks, maxcontext=None):

1556

def parsepatch(originalchunks, maxcontext=None):

1556

"""patch -> [] of headers -> [] of hunks

1557

"""patch -> [] of headers -> [] of hunks

1557

1558

If maxcontext is not None, trim context lines if necessary.

1559

If maxcontext is not None, trim context lines if necessary.

1559

1560

>>> rawpatch = b'''diff --git a/folder1/g b/folder1/g

1561

>>> rawpatch = b'''diff --git a/folder1/g b/folder1/g

1561

... --- a/folder1/g

1562

... --- a/folder1/g

1562

... +++ b/folder1/g

1563

... +++ b/folder1/g

1563

... @@ -1,8 +1,10 @@

1564

... @@ -1,8 +1,10 @@

1564

... 1

1565

... 1

1565

... 2

1566

... 2

1566

... -3

1567

... -3

1567

... 4

1568

... 4

1568

... 5

1569

... 5

1569

... 6

1570

... 6

1570

... +6.1

1571

... +6.1

1571

... +6.2

1572

... +6.2

1572

... 7

1573

... 7

1573

... 8

1574

... 8

1574

... +9'''

1575

... +9'''

1575

>>> out = util.stringio()

1576

>>> out = util.stringio()

1576

>>> headers = parsepatch([rawpatch], maxcontext=1)

1577

>>> headers = parsepatch([rawpatch], maxcontext=1)

1577

>>> for header in headers:

1578

>>> for header in headers:

1578

... header.write(out)

1579

... header.write(out)

1579

... for hunk in header.hunks:

1580

... for hunk in header.hunks:

1580

... hunk.write(out)

1581

... hunk.write(out)

1581

>>> print(pycompat.sysstr(out.getvalue()))

1582

>>> print(pycompat.sysstr(out.getvalue()))

1582

diff --git a/folder1/g b/folder1/g

1583

diff --git a/folder1/g b/folder1/g

1583

--- a/folder1/g

1584

--- a/folder1/g

1584

+++ b/folder1/g

1585

+++ b/folder1/g

1585

@@ -2,3 +2,2 @@

1586

@@ -2,3 +2,2 @@

1586

2

1587

2

1587

-3

1588

-3

1588

4

1589

4

1589

@@ -6,2 +5,4 @@

1590

@@ -6,2 +5,4 @@

1590

6

1591

6

1591

+6.1

1592

+6.1

1592

+6.2

1593

+6.2

1593

7

1594

7

1594

@@ -8,1 +9,2 @@

1595

@@ -8,1 +9,2 @@

1595

8

1596

8

1596

+9

1597

+9

1597

"""

1598

"""

1598

class parser(object):

1599

class parser(object):

1599

"""patch parsing state machine"""

1600

"""patch parsing state machine"""

1600

def __init__(self):

1601

def __init__(self):

1601

self.fromline = 0

1602

self.fromline = 0

1602

self.toline = 0

1603

self.toline = 0

1603

self.proc = ''

1604

self.proc = ''

1604

self.header = None

1605

self.header = None

1605

self.context = []

1606

self.context = []

1606

self.before = []

1607

self.before = []

1607

self.hunk = []

1608

self.hunk = []

1608

self.headers = []

1609

self.headers = []

1609

1610

def addrange(self, limits):

1611

def addrange(self, limits):

1611

self.addcontext([])

1612

self.addcontext([])

1612

fromstart, fromend, tostart, toend, proc = limits

1613

fromstart, fromend, tostart, toend, proc = limits

1613

self.fromline = int(fromstart)

1614

self.fromline = int(fromstart)

1614

self.toline = int(tostart)

1615

self.toline = int(tostart)

1615

self.proc = proc

1616

self.proc = proc

1616

1617

def addcontext(self, context):

1618

def addcontext(self, context):

1618

if self.hunk:

1619

if self.hunk:

1619

h = recordhunk(self.header, self.fromline, self.toline,

1620

h = recordhunk(self.header, self.fromline, self.toline,

1620

self.proc, self.before, self.hunk, context, maxcontext)

1621

self.proc, self.before, self.hunk, context, maxcontext)

1621

self.header.hunks.append(h)

1622

self.header.hunks.append(h)

1622

self.fromline += len(self.before) + h.removed

1623

self.fromline += len(self.before) + h.removed

1623

self.toline += len(self.before) + h.added

1624

self.toline += len(self.before) + h.added

1624

self.before = []

1625

self.before = []

1625

self.hunk = []

1626

self.hunk = []

1626

self.context = context

1627

self.context = context

1627

1628

def addhunk(self, hunk):

1629

def addhunk(self, hunk):

1629

if self.context:

1630

if self.context:

1630

self.before = self.context

1631

self.before = self.context

1631

self.context = []

1632

self.context = []

1632

if self.hunk:

1633

if self.hunk:

1633

self.addcontext([])

1634

self.addcontext([])

1634

self.hunk = hunk

1635

self.hunk = hunk

1635

1636

def newfile(self, hdr):

1637

def newfile(self, hdr):

1637

self.addcontext([])

1638

self.addcontext([])

1638

h = header(hdr)

1639

h = header(hdr)

1639

self.headers.append(h)

1640

self.headers.append(h)

1640

self.header = h

1641

self.header = h

1641

1642

def addother(self, line):

1643

def addother(self, line):

1643

pass # 'other' lines are ignored

1644

pass # 'other' lines are ignored

1644

1645

def finished(self):

1646

def finished(self):

1646

self.addcontext([])

1647

self.addcontext([])

1647

return self.headers

1648

return self.headers

1648

1649

transitions = {

1650

transitions = {

1650

'file': {'context': addcontext,

1651

'file': {'context': addcontext,

1651

'file': newfile,

1652

'file': newfile,

1652

'hunk': addhunk,

1653

'hunk': addhunk,

1653

'range': addrange},

1654

'range': addrange},

1654

'context': {'file': newfile,

1655

'context': {'file': newfile,

1655

'hunk': addhunk,

1656

'hunk': addhunk,

1656

'range': addrange,

1657

'range': addrange,

1657

'other': addother},

1658

'other': addother},

1658

'hunk': {'context': addcontext,

1659

'hunk': {'context': addcontext,

1659

'file': newfile,

1660

'file': newfile,

1660

'range': addrange},

1661

'range': addrange},

1661

'range': {'context': addcontext,

1662

'range': {'context': addcontext,

1662

'hunk': addhunk},

1663

'hunk': addhunk},

1663

'other': {'other': addother},

1664

'other': {'other': addother},

1664

}

1665

}

1665

1666

p = parser()

1667

p = parser()

1667

fp = stringio()

1668

fp = stringio()

1668

fp.write(''.join(originalchunks))

1669

fp.write(''.join(originalchunks))

1669

fp.seek(0)

1670

fp.seek(0)

1670

1671

state = 'context'

1672

state = 'context'

1672

for newstate, data in scanpatch(fp):

1673

for newstate, data in scanpatch(fp):

1673

try:

1674

try:

1674

p.transitions[state][newstate](p, data)

1675

p.transitions[state][newstate](p, data)

1675

except KeyError:

1676

except KeyError:

1676

raise PatchError('unhandled transition: %s -> %s' %

1677

raise PatchError('unhandled transition: %s -> %s' %

1677

(state, newstate))

1678

(state, newstate))

1678

state = newstate

1679

state = newstate

1679

del fp

1680

del fp

1680

return p.finished()

1681

return p.finished()

1681

1682

def pathtransform(path, strip, prefix):

1683

def pathtransform(path, strip, prefix):

1683

'''turn a path from a patch into a path suitable for the repository

1684

'''turn a path from a patch into a path suitable for the repository

1684

1685

prefix, if not empty, is expected to be normalized with a / at the end.

1686

prefix, if not empty, is expected to be normalized with a / at the end.

1686

1687

Returns (stripped components, path in repository).

1688

Returns (stripped components, path in repository).

1688

1689

>>> pathtransform(b'a/b/c', 0, b'')

1690

>>> pathtransform(b'a/b/c', 0, b'')

1690

('', 'a/b/c')

1691

('', 'a/b/c')

1691

>>> pathtransform(b' a/b/c ', 0, b'')

1692

>>> pathtransform(b' a/b/c ', 0, b'')

1692

('', ' a/b/c')

1693

('', ' a/b/c')

1693

>>> pathtransform(b' a/b/c ', 2, b'')

1694

>>> pathtransform(b' a/b/c ', 2, b'')

1694

('a/b/', 'c')

1695

('a/b/', 'c')

1695

>>> pathtransform(b'a/b/c', 0, b'd/e/')

1696

>>> pathtransform(b'a/b/c', 0, b'd/e/')

1696

('', 'd/e/a/b/c')

1697

('', 'd/e/a/b/c')

1697

>>> pathtransform(b' a//b/c ', 2, b'd/e/')

1698

>>> pathtransform(b' a//b/c ', 2, b'd/e/')

1698

('a//b/', 'd/e/c')

1699

('a//b/', 'd/e/c')

1699

>>> pathtransform(b'a/b/c', 3, b'')

1700

>>> pathtransform(b'a/b/c', 3, b'')

1700

Traceback (most recent call last):

1701

Traceback (most recent call last):

1701

PatchError: unable to strip away 1 of 3 dirs from a/b/c

1702

PatchError: unable to strip away 1 of 3 dirs from a/b/c

1702

'''

1703

'''

1703

pathlen = len(path)

1704

pathlen = len(path)

1704

i = 0

1705

i = 0

1705

if strip == 0:

1706

if strip == 0:

1706

return '', prefix + path.rstrip()

1707

return '', prefix + path.rstrip()

1707

count = strip

1708

count = strip

1708

while count > 0:

1709

while count > 0:

1709

i = path.find('/', i)

1710

i = path.find('/', i)

1710

if i == -1:

1711

if i == -1:

1711

raise PatchError(_("unable to strip away %d of %d dirs from %s") %

1712

raise PatchError(_("unable to strip away %d of %d dirs from %s") %

1712

(count, strip, path))

1713

(count, strip, path))

1713

i += 1

1714

i += 1

1714

# consume '//' in the path

1715

# consume '//' in the path

1715

while i < pathlen - 1 and path[i:i + 1] == '/':

1716

while i < pathlen - 1 and path[i:i + 1] == '/':

1716

i += 1

1717

i += 1

1717

count -= 1

1718

count -= 1

1718

return path[:i].lstrip(), prefix + path[i:].rstrip()

1719

return path[:i].lstrip(), prefix + path[i:].rstrip()

1719

1720

def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):

1721

def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):

1721

nulla = afile_orig == "/dev/null"

1722

nulla = afile_orig == "/dev/null"

1722

nullb = bfile_orig == "/dev/null"

1723

nullb = bfile_orig == "/dev/null"

1723

create = nulla and hunk.starta == 0 and hunk.lena == 0

1724

create = nulla and hunk.starta == 0 and hunk.lena == 0

1724

remove = nullb and hunk.startb == 0 and hunk.lenb == 0

1725

remove = nullb and hunk.startb == 0 and hunk.lenb == 0

1725

abase, afile = pathtransform(afile_orig, strip, prefix)

1726

abase, afile = pathtransform(afile_orig, strip, prefix)

1726

gooda = not nulla and backend.exists(afile)

1727

gooda = not nulla and backend.exists(afile)

1727

bbase, bfile = pathtransform(bfile_orig, strip, prefix)

1728

bbase, bfile = pathtransform(bfile_orig, strip, prefix)

1728

if afile == bfile:

1729

if afile == bfile:

1729

goodb = gooda

1730

goodb = gooda

1730

else:

1731

else:

1731

goodb = not nullb and backend.exists(bfile)

1732

goodb = not nullb and backend.exists(bfile)

1732

missing = not goodb and not gooda and not create

1733

missing = not goodb and not gooda and not create

1733

1734

# some diff programs apparently produce patches where the afile is

1735

# some diff programs apparently produce patches where the afile is

1735

# not /dev/null, but afile starts with bfile

1736

# not /dev/null, but afile starts with bfile

1736

abasedir = afile[:afile.rfind('/') + 1]

1737

abasedir = afile[:afile.rfind('/') + 1]

1737

bbasedir = bfile[:bfile.rfind('/') + 1]

1738

bbasedir = bfile[:bfile.rfind('/') + 1]

1738

if (missing and abasedir == bbasedir and afile.startswith(bfile)

1739

if (missing and abasedir == bbasedir and afile.startswith(bfile)

1739

and hunk.starta == 0 and hunk.lena == 0):

1740

and hunk.starta == 0 and hunk.lena == 0):

1740

create = True

1741

create = True

1741

missing = False

1742

missing = False

1742

1743

# If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the

1744

# If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the

1744

# diff is between a file and its backup. In this case, the original

1745

# diff is between a file and its backup. In this case, the original

1745

# file should be patched (see original mpatch code).

1746

# file should be patched (see original mpatch code).

1746

isbackup = (abase == bbase and bfile.startswith(afile))

1747

isbackup = (abase == bbase and bfile.startswith(afile))

1747

fname = None

1748

fname = None

1748

if not missing:

1749

if not missing:

1749

if gooda and goodb:

1750

if gooda and goodb:

1750

if isbackup:

1751

if isbackup:

1751

fname = afile

1752

fname = afile

1752

else:

1753

else:

1753

fname = bfile

1754

fname = bfile

1754

elif gooda:

1755

elif gooda:

1755

fname = afile

1756

fname = afile

1756

1757

if not fname:

1758

if not fname:

1758

if not nullb:

1759

if not nullb:

1759

if isbackup:

1760

if isbackup:

1760

fname = afile

1761

fname = afile

1761

else:

1762

else:

1762

fname = bfile

1763

fname = bfile

1763

elif not nulla:

1764

elif not nulla:

1764

fname = afile

1765

fname = afile

1765

else:

1766

else:

1766

raise PatchError(_("undefined source and destination files"))

1767

raise PatchError(_("undefined source and destination files"))

1767

1768

gp = patchmeta(fname)

1769

gp = patchmeta(fname)

1769

if create:

1770

if create:

1770

gp.op = 'ADD'

1771

gp.op = 'ADD'

1771

elif remove:

1772

elif remove:

1772

gp.op = 'DELETE'

1773

gp.op = 'DELETE'

1773

return gp

1774

return gp

1774

1775

def scanpatch(fp):

1776

def scanpatch(fp):

1776

"""like patch.iterhunks, but yield different events

1777

"""like patch.iterhunks, but yield different events

1777

1778

- ('file', [header_lines + fromfile + tofile])

1779

- ('file', [header_lines + fromfile + tofile])

1779

- ('context', [context_lines])

1780

- ('context', [context_lines])

1780

- ('hunk', [hunk_lines])

1781

- ('hunk', [hunk_lines])

1781

- ('range', (-start,len, +start,len, proc))

1782

- ('range', (-start,len, +start,len, proc))

1782

"""

1783

"""

1783

lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')

1784

lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')

1784

lr = linereader(fp)

1785

lr = linereader(fp)

1785

1786

def scanwhile(first, p):

1787

def scanwhile(first, p):

1787

"""scan lr while predicate holds"""

1788

"""scan lr while predicate holds"""

1788

lines = [first]

1789

lines = [first]

1789

for line in iter(lr.readline, ''):

1790

for line in iter(lr.readline, ''):

1790

if p(line):

1791

if p(line):

1791

lines.append(line)

1792

lines.append(line)

1792

else:

1793

else:

1793

lr.push(line)

1794

lr.push(line)

1794

break

1795

break

1795

return lines

1796

return lines

1796

1797

for line in iter(lr.readline, ''):

1798

for line in iter(lr.readline, ''):

1798

if line.startswith('diff --git a/') or line.startswith('diff -r '):

1799

if line.startswith('diff --git a/') or line.startswith('diff -r '):

1799

def notheader(line):

1800

def notheader(line):

1800

s = line.split(None, 1)

1801

s = line.split(None, 1)

1801

return not s or s[0] not in ('---', 'diff')

1802

return not s or s[0] not in ('---', 'diff')

1802

header = scanwhile(line, notheader)

1803

header = scanwhile(line, notheader)

1803

fromfile = lr.readline()

1804

fromfile = lr.readline()

1804

if fromfile.startswith('---'):

1805

if fromfile.startswith('---'):

1805

tofile = lr.readline()

1806

tofile = lr.readline()

1806

header += [fromfile, tofile]

1807

header += [fromfile, tofile]

1807

else:

1808

else:

1808

lr.push(fromfile)

1809

lr.push(fromfile)

1809

yield 'file', header

1810

yield 'file', header

1810

elif line.startswith(' '):

1811

elif line.startswith(' '):

1811

cs = (' ', '\\')

1812

cs = (' ', '\\')

1812

yield 'context', scanwhile(line, lambda l: l.startswith(cs))

1813

yield 'context', scanwhile(line, lambda l: l.startswith(cs))

1813

elif line.startswith(('-', '+')):

1814

elif line.startswith(('-', '+')):

1814

cs = ('-', '+', '\\')

1815

cs = ('-', '+', '\\')

1815

yield 'hunk', scanwhile(line, lambda l: l.startswith(cs))

1816

yield 'hunk', scanwhile(line, lambda l: l.startswith(cs))

1816

else:

1817

else:

1817

m = lines_re.match(line)

1818

m = lines_re.match(line)

1818

if m:

1819

if m:

1819

yield 'range', m.groups()

1820

yield 'range', m.groups()

1820

else:

1821

else:

1821

yield 'other', line

1822

yield 'other', line

1822

1823

def scangitpatch(lr, firstline):

1824

def scangitpatch(lr, firstline):

1824

"""

1825

"""

1825

Git patches can emit:

1826

Git patches can emit:

1826

- rename a to b

1827

- rename a to b

1827

- change b

1828

- change b

1828

- copy a to c

1829

- copy a to c

1829

- change c

1830

- change c

1830

1831

We cannot apply this sequence as-is, the renamed 'a' could not be

1832

We cannot apply this sequence as-is, the renamed 'a' could not be

1832

found for it would have been renamed already. And we cannot copy

1833

found for it would have been renamed already. And we cannot copy

1833

from 'b' instead because 'b' would have been changed already. So

1834

from 'b' instead because 'b' would have been changed already. So

1834

we scan the git patch for copy and rename commands so we can

1835

we scan the git patch for copy and rename commands so we can

1835

perform the copies ahead of time.

1836

perform the copies ahead of time.

1836

"""

1837

"""

1837

pos = 0

1838

pos = 0

1838

try:

1839

try:

1839

pos = lr.fp.tell()

1840

pos = lr.fp.tell()

1840

fp = lr.fp

1841

fp = lr.fp

1841

except IOError:

1842

except IOError:

1842

fp = stringio(lr.fp.read())

1843

fp = stringio(lr.fp.read())

1843

gitlr = linereader(fp)

1844

gitlr = linereader(fp)

1844

gitlr.push(firstline)

1845

gitlr.push(firstline)

1845

gitpatches = readgitpatch(gitlr)

1846

gitpatches = readgitpatch(gitlr)

1846

fp.seek(pos)

1847

fp.seek(pos)

1847

return gitpatches

1848

return gitpatches

1848

1849

def iterhunks(fp):

1850

def iterhunks(fp):

1850

"""Read a patch and yield the following events:

1851

"""Read a patch and yield the following events:

1851

- ("file", afile, bfile, firsthunk): select a new target file.

1852

- ("file", afile, bfile, firsthunk): select a new target file.

1852

- ("hunk", hunk): a new hunk is ready to be applied, follows a

1853

- ("hunk", hunk): a new hunk is ready to be applied, follows a

1853

"file" event.

1854

"file" event.

1854

- ("git", gitchanges): current diff is in git format, gitchanges

1855

- ("git", gitchanges): current diff is in git format, gitchanges

1855

maps filenames to gitpatch records. Unique event.

1856

maps filenames to gitpatch records. Unique event.

1856

"""

1857

"""

1857

afile = ""

1858

afile = ""

1858

bfile = ""

1859

bfile = ""

1859

state = None

1860

state = None

1860

hunknum = 0

1861

hunknum = 0

1861

emitfile = newfile = False

1862

emitfile = newfile = False

1862

gitpatches = None

1863

gitpatches = None

1863

1864

# our states

1865

# our states

1865

BFILE = 1

1866

BFILE = 1

1866

context = None

1867

context = None

1867

lr = linereader(fp)

1868

lr = linereader(fp)

1868

1869

for x in iter(lr.readline, ''):

1870

for x in iter(lr.readline, ''):

1870

if state == BFILE and (

1871

if state == BFILE and (

1871

(not context and x.startswith('@'))

1872

(not context and x.startswith('@'))

1872

or (context is not False and x.startswith('***************'))

1873

or (context is not False and x.startswith('***************'))

1873

or x.startswith('GIT binary patch')):

1874

or x.startswith('GIT binary patch')):

1874

gp = None

1875

gp = None

1875

if (gitpatches and

1876

if (gitpatches and

1876

gitpatches[-1].ispatching(afile, bfile)):

1877

gitpatches[-1].ispatching(afile, bfile)):

1877

gp = gitpatches.pop()

1878

gp = gitpatches.pop()

1878

if x.startswith('GIT binary patch'):

1879

if x.startswith('GIT binary patch'):

1879

h = binhunk(lr, gp.path)

1880

h = binhunk(lr, gp.path)

1880

else:

1881

else:

1881

if context is None and x.startswith('***************'):

1882

if context is None and x.startswith('***************'):

1882

context = True

1883

context = True

1883

h = hunk(x, hunknum + 1, lr, context)

1884

h = hunk(x, hunknum + 1, lr, context)

1884

hunknum += 1

1885

hunknum += 1

1885

if emitfile:

1886

if emitfile:

1886

emitfile = False

1887

emitfile = False

1887

yield 'file', (afile, bfile, h, gp and gp.copy() or None)

1888

yield 'file', (afile, bfile, h, gp and gp.copy() or None)

1888

yield 'hunk', h

1889

yield 'hunk', h

1889

elif x.startswith('diff --git a/'):

1890

elif x.startswith('diff --git a/'):

1890

m = gitre.match(x.rstrip(' \r\n'))

1891

m = gitre.match(x.rstrip(' \r\n'))

1891

if not m:

1892

if not m:

1892

continue

1893

continue

1893

if gitpatches is None:

1894

if gitpatches is None:

1894

# scan whole input for git metadata

1895

# scan whole input for git metadata

1895

gitpatches = scangitpatch(lr, x)

1896

gitpatches = scangitpatch(lr, x)

1896

yield 'git', [g.copy() for g in gitpatches

1897

yield 'git', [g.copy() for g in gitpatches

1897

if g.op in ('COPY', 'RENAME')]

1898

if g.op in ('COPY', 'RENAME')]

1898

gitpatches.reverse()

1899

gitpatches.reverse()

1899

afile = 'a/' + m.group(1)

1900

afile = 'a/' + m.group(1)

1900

bfile = 'b/' + m.group(2)

1901

bfile = 'b/' + m.group(2)

1901

while gitpatches and not gitpatches[-1].ispatching(afile, bfile):

1902

while gitpatches and not gitpatches[-1].ispatching(afile, bfile):

1902

gp = gitpatches.pop()

1903

gp = gitpatches.pop()

1903

yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())

1904

yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())

1904

if not gitpatches:

1905

if not gitpatches:

1905

raise PatchError(_('failed to synchronize metadata for "%s"')

1906

raise PatchError(_('failed to synchronize metadata for "%s"')

1906

% afile[2:])

1907

% afile[2:])

1907

newfile = True

1908

newfile = True

1908

elif x.startswith('---'):

1909

elif x.startswith('---'):

1909

# check for a unified diff

1910

# check for a unified diff

1910

l2 = lr.readline()

1911

l2 = lr.readline()

1911

if not l2.startswith('+++'):

1912

if not l2.startswith('+++'):

1912

lr.push(l2)

1913

lr.push(l2)

1913

continue

1914

continue

1914

newfile = True

1915

newfile = True

1915

context = False

1916

context = False

1916

afile = parsefilename(x)

1917

afile = parsefilename(x)

1917

bfile = parsefilename(l2)

1918

bfile = parsefilename(l2)

1918

elif x.startswith('***'):

1919

elif x.startswith('***'):

1919

# check for a context diff

1920

# check for a context diff

1920

l2 = lr.readline()

1921

l2 = lr.readline()

1921

if not l2.startswith('---'):

1922

if not l2.startswith('---'):

1922

lr.push(l2)

1923

lr.push(l2)

1923

continue

1924

continue

1924

l3 = lr.readline()

1925

l3 = lr.readline()

1925

lr.push(l3)

1926

lr.push(l3)

1926

if not l3.startswith("***************"):

1927

if not l3.startswith("***************"):

1927

lr.push(l2)

1928

lr.push(l2)

1928

continue

1929

continue

1929

newfile = True

1930

newfile = True

1930

context = True

1931

context = True

1931

afile = parsefilename(x)

1932

afile = parsefilename(x)

1932

bfile = parsefilename(l2)

1933

bfile = parsefilename(l2)

1933

1934

if newfile:

1935

if newfile:

1935

newfile = False

1936

newfile = False

1936

emitfile = True

1937

emitfile = True

1937

state = BFILE

1938

state = BFILE

1938

hunknum = 0

1939

hunknum = 0

1939

1940

while gitpatches:

1941

while gitpatches:

1941

gp = gitpatches.pop()

1942

gp = gitpatches.pop()

1942

yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())

1943

yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())

1943

1944

def applybindelta(binchunk, data):

1945

def applybindelta(binchunk, data):

1945

"""Apply a binary delta hunk

1946

"""Apply a binary delta hunk

1946

The algorithm used is the algorithm from git's patch-delta.c

1947

The algorithm used is the algorithm from git's patch-delta.c

1947

"""

1948

"""

1948

def deltahead(binchunk):

1949

def deltahead(binchunk):

1949

i = 0

1950

i = 0

1950

for c in pycompat.bytestr(binchunk):

1951

for c in pycompat.bytestr(binchunk):

1951

i += 1

1952

i += 1

1952

if not (ord(c) & 0x80):

1953

if not (ord(c) & 0x80):

1953

return i

1954

return i

1954

return i

1955

return i

1955

out = ""

1956

out = ""

1956

s = deltahead(binchunk)

1957

s = deltahead(binchunk)

1957

binchunk = binchunk[s:]

1958

binchunk = binchunk[s:]

1958

s = deltahead(binchunk)

1959

s = deltahead(binchunk)

1959

binchunk = binchunk[s:]

1960

binchunk = binchunk[s:]

1960

i = 0

1961

i = 0

1961

while i < len(binchunk):

1962

while i < len(binchunk):

1962

cmd = ord(binchunk[i:i + 1])

1963

cmd = ord(binchunk[i:i + 1])

1963

i += 1

1964

i += 1

1964

if (cmd & 0x80):

1965

if (cmd & 0x80):

1965

offset = 0

1966

offset = 0

1966

size = 0

1967

size = 0

1967

if (cmd & 0x01):

1968

if (cmd & 0x01):

1968

offset = ord(binchunk[i:i + 1])

1969

offset = ord(binchunk[i:i + 1])

1969

i += 1

1970

i += 1

1970

if (cmd & 0x02):

1971

if (cmd & 0x02):

1971

offset |= ord(binchunk[i:i + 1]) << 8

1972

offset |= ord(binchunk[i:i + 1]) << 8

1972

i += 1

1973

i += 1

1973

if (cmd & 0x04):

1974

if (cmd & 0x04):

1974

offset |= ord(binchunk[i:i + 1]) << 16

1975

offset |= ord(binchunk[i:i + 1]) << 16

1975

i += 1

1976

i += 1

1976

if (cmd & 0x08):

1977

if (cmd & 0x08):

1977

offset |= ord(binchunk[i:i + 1]) << 24

1978

offset |= ord(binchunk[i:i + 1]) << 24

1978

i += 1

1979

i += 1

1979

if (cmd & 0x10):

1980

if (cmd & 0x10):

1980

size = ord(binchunk[i:i + 1])

1981

size = ord(binchunk[i:i + 1])

1981

i += 1

1982

i += 1

1982

if (cmd & 0x20):

1983

if (cmd & 0x20):

1983

size |= ord(binchunk[i:i + 1]) << 8

1984

size |= ord(binchunk[i:i + 1]) << 8

1984

i += 1

1985

i += 1

1985

if (cmd & 0x40):

1986

if (cmd & 0x40):

1986

size |= ord(binchunk[i:i + 1]) << 16

1987

size |= ord(binchunk[i:i + 1]) << 16

1987

i += 1

1988

i += 1

1988

if size == 0:

1989

if size == 0:

1989

size = 0x10000

1990

size = 0x10000

1990

offset_end = offset + size

1991

offset_end = offset + size

1991

out += data[offset:offset_end]

1992

out += data[offset:offset_end]

1992

elif cmd != 0:

1993

elif cmd != 0:

1993

offset_end = i + cmd

1994

offset_end = i + cmd

1994

out += binchunk[i:offset_end]

1995

out += binchunk[i:offset_end]

1995

i += cmd

1996

i += cmd

1996

else:

1997

else:

1997

raise PatchError(_('unexpected delta opcode 0'))

1998

raise PatchError(_('unexpected delta opcode 0'))

1998

return out

1999

return out

1999

2000

def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):

2001

def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):

2001

"""Reads a patch from fp and tries to apply it.

2002

"""Reads a patch from fp and tries to apply it.

2002

2003

Returns 0 for a clean patch, -1 if any rejects were found and 1 if

2004

Returns 0 for a clean patch, -1 if any rejects were found and 1 if

2004

there was any fuzz.

2005

there was any fuzz.

2005

2006

If 'eolmode' is 'strict', the patch content and patched file are

2007

If 'eolmode' is 'strict', the patch content and patched file are

2007

read in binary mode. Otherwise, line endings are ignored when

2008

read in binary mode. Otherwise, line endings are ignored when

2008

patching then normalized according to 'eolmode'.

2009

patching then normalized according to 'eolmode'.

2009

"""

2010

"""

2010

return _applydiff(ui, fp, patchfile, backend, store, strip=strip,

2011

return _applydiff(ui, fp, patchfile, backend, store, strip=strip,

2011

prefix=prefix, eolmode=eolmode)

2012

prefix=prefix, eolmode=eolmode)

2012

2013

def _canonprefix(repo, prefix):

2014

def _canonprefix(repo, prefix):

2014

if prefix:

2015

if prefix:

2015

prefix = pathutil.canonpath(repo.root, repo.getcwd(), prefix)

2016

prefix = pathutil.canonpath(repo.root, repo.getcwd(), prefix)

2016

if prefix != '':

2017

if prefix != '':

2017

prefix += '/'

2018

prefix += '/'

2018

return prefix

2019

return prefix

2019

2020

def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',

2021

def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',

2021

eolmode='strict'):

2022

eolmode='strict'):

2022

prefix = _canonprefix(backend.repo, prefix)

2023

prefix = _canonprefix(backend.repo, prefix)

2023

def pstrip(p):

2024

def pstrip(p):

2024

return pathtransform(p, strip - 1, prefix)[1]

2025

return pathtransform(p, strip - 1, prefix)[1]

2025

2026

rejects = 0

2027

rejects = 0

2027

err = 0

2028

err = 0

2028

current_file = None

2029

current_file = None

2029

2030

for state, values in iterhunks(fp):

2031

for state, values in iterhunks(fp):

2031

if state == 'hunk':

2032

if state == 'hunk':

2032

if not current_file:

2033

if not current_file:

2033

continue

2034

continue

2034

ret = current_file.apply(values)

2035

ret = current_file.apply(values)

2035

if ret > 0:

2036

if ret > 0:

2036

err = 1

2037

err = 1

2037

elif state == 'file':

2038

elif state == 'file':

2038

if current_file:

2039

if current_file:

2039

rejects += current_file.close()

2040

rejects += current_file.close()

2040

current_file = None

2041

current_file = None

2041

afile, bfile, first_hunk, gp = values

2042

afile, bfile, first_hunk, gp = values

2042

if gp:

2043

if gp:

2043

gp.path = pstrip(gp.path)

2044

gp.path = pstrip(gp.path)

2044

if gp.oldpath:

2045

if gp.oldpath:

2045

gp.oldpath = pstrip(gp.oldpath)

2046

gp.oldpath = pstrip(gp.oldpath)

2046

else:

2047

else:

2047

gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,

2048

gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,

2048

prefix)

2049

prefix)

2049

if gp.op == 'RENAME':

2050

if gp.op == 'RENAME':

2050

backend.unlink(gp.oldpath)

2051

backend.unlink(gp.oldpath)

2051

if not first_hunk:

2052

if not first_hunk:

2052

if gp.op == 'DELETE':

2053

if gp.op == 'DELETE':

2053

backend.unlink(gp.path)

2054

backend.unlink(gp.path)

2054

continue

2055

continue

2055

data, mode = None, None

2056

data, mode = None, None

2056

if gp.op in ('RENAME', 'COPY'):

2057

if gp.op in ('RENAME', 'COPY'):

2057

data, mode = store.getfile(gp.oldpath)[:2]

2058

data, mode = store.getfile(gp.oldpath)[:2]

2058

if data is None:

2059

if data is None:

2059

# This means that the old path does not exist

2060

# This means that the old path does not exist

2060

raise PatchError(_("source file '%s' does not exist")

2061

raise PatchError(_("source file '%s' does not exist")

2061

% gp.oldpath)

2062

% gp.oldpath)

2062

if gp.mode:

2063

if gp.mode:

2063

mode = gp.mode

2064

mode = gp.mode

2064

if gp.op == 'ADD':

2065

if gp.op == 'ADD':

2065

# Added files without content have no hunk and

2066

# Added files without content have no hunk and

2066

# must be created

2067

# must be created

2067

data = ''

2068

data = ''

2068

if data or mode:

2069

if data or mode:

2069

if (gp.op in ('ADD', 'RENAME', 'COPY')

2070

if (gp.op in ('ADD', 'RENAME', 'COPY')

2070

and backend.exists(gp.path)):

2071

and backend.exists(gp.path)):

2071

raise PatchError(_("cannot create %s: destination "

2072

raise PatchError(_("cannot create %s: destination "

2072

"already exists") % gp.path)

2073

"already exists") % gp.path)

2073

backend.setfile(gp.path, data, mode, gp.oldpath)

2074

backend.setfile(gp.path, data, mode, gp.oldpath)

2074

continue

2075

continue

2075

try:

2076

try:

2076

current_file = patcher(ui, gp, backend, store,

2077

current_file = patcher(ui, gp, backend, store,

2077

eolmode=eolmode)

2078

eolmode=eolmode)

2078

except PatchError as inst:

2079

except PatchError as inst:

2079

ui.warn(str(inst) + '\n')

2080

ui.warn(str(inst) + '\n')

2080

current_file = None

2081

current_file = None

2081

rejects += 1

2082

rejects += 1

2082

continue

2083

continue

2083

elif state == 'git':

2084

elif state == 'git':

2084

for gp in values:

2085

for gp in values:

2085

path = pstrip(gp.oldpath)

2086

path = pstrip(gp.oldpath)

2086

data, mode = backend.getfile(path)

2087

data, mode = backend.getfile(path)

2087

if data is None:

2088

if data is None:

2088

# The error ignored here will trigger a getfile()

2089

# The error ignored here will trigger a getfile()

2089

# error in a place more appropriate for error

2090

# error in a place more appropriate for error

2090

# handling, and will not interrupt the patching

2091

# handling, and will not interrupt the patching

2091

# process.

2092

# process.

2092

pass

2093

pass

2093

else:

2094

else:

2094

store.setfile(path, data, mode)

2095

store.setfile(path, data, mode)

2095

else:

2096

else:

2096

raise error.Abort(_('unsupported parser state: %s') % state)

2097

raise error.Abort(_('unsupported parser state: %s') % state)

2097

2098

if current_file:

2099

if current_file:

2099

rejects += current_file.close()

2100

rejects += current_file.close()

2100

2101

if rejects:

2102

if rejects:

2102

return -1

2103

return -1

2103

return err

2104

return err

2104

2105

def _externalpatch(ui, repo, patcher, patchname, strip, files,

2106

def _externalpatch(ui, repo, patcher, patchname, strip, files,

2106

similarity):

2107

similarity):

2107

"""use <patcher> to apply <patchname> to the working directory.

2108

"""use <patcher> to apply <patchname> to the working directory.

2108

returns whether patch was applied with fuzz factor."""

2109

returns whether patch was applied with fuzz factor."""

2109

2110

fuzz = False

2111

fuzz = False

2111

args = []

2112

args = []

2112

cwd = repo.root

2113

cwd = repo.root

2113

if cwd:

2114

if cwd:

2114

args.append('-d %s' % procutil.shellquote(cwd))

2115

args.append('-d %s' % procutil.shellquote(cwd))

2115

cmd = ('%s %s -p%d < %s'

2116

cmd = ('%s %s -p%d < %s'

2116

% (patcher, ' '.join(args), strip, procutil.shellquote(patchname)))

2117

% (patcher, ' '.join(args), strip, procutil.shellquote(patchname)))

2117

ui.debug('Using external patch tool: %s\n' % cmd)

2118

ui.debug('Using external patch tool: %s\n' % cmd)

2118

fp = procutil.popen(cmd, 'rb')

2119

fp = procutil.popen(cmd, 'rb')

2119

try:

2120

try:

2120

for line in util.iterfile(fp):

2121

for line in util.iterfile(fp):

2121

line = line.rstrip()

2122

line = line.rstrip()

2122

ui.note(line + '\n')

2123

ui.note(line + '\n')

2123

if line.startswith('patching file '):

2124

if line.startswith('patching file '):

2124

pf = util.parsepatchoutput(line)

2125

pf = util.parsepatchoutput(line)

2125

printed_file = False

2126

printed_file = False

2126

files.add(pf)

2127

files.add(pf)

2127

elif line.find('with fuzz') >= 0:

2128

elif line.find('with fuzz') >= 0:

2128

fuzz = True

2129

fuzz = True

2129

if not printed_file:

2130

if not printed_file:

2130

ui.warn(pf + '\n')

2131

ui.warn(pf + '\n')

2131

printed_file = True

2132

printed_file = True

2132

ui.warn(line + '\n')

2133

ui.warn(line + '\n')

2133

elif line.find('saving rejects to file') >= 0:

2134

elif line.find('saving rejects to file') >= 0:

2134

ui.warn(line + '\n')

2135

ui.warn(line + '\n')

2135

elif line.find('FAILED') >= 0:

2136

elif line.find('FAILED') >= 0:

2136

if not printed_file:

2137

if not printed_file:

2137

ui.warn(pf + '\n')

2138

ui.warn(pf + '\n')

2138

printed_file = True

2139

printed_file = True

2139

ui.warn(line + '\n')

2140

ui.warn(line + '\n')

2140

finally:

2141

finally:

2141

if files:

2142

if files:

2142

scmutil.marktouched(repo, files, similarity)

2143

scmutil.marktouched(repo, files, similarity)

2143

code = fp.close()

2144

code = fp.close()

2144

if code:

2145

if code:

2145

raise PatchError(_("patch command failed: %s") %

2146

raise PatchError(_("patch command failed: %s") %

2146

procutil.explainexit(code))

2147

procutil.explainexit(code))

2147

return fuzz

2148

return fuzz

2148

2149

def patchbackend(ui, backend, patchobj, strip, prefix, files=None,

2150

def patchbackend(ui, backend, patchobj, strip, prefix, files=None,

2150

eolmode='strict'):

2151

eolmode='strict'):

2151

if files is None:

2152

if files is None:

2152

files = set()

2153

files = set()

2153

if eolmode is None:

2154

if eolmode is None:

2154

eolmode = ui.config('patch', 'eol')

2155

eolmode = ui.config('patch', 'eol')

2155

if eolmode.lower() not in eolmodes:

2156

if eolmode.lower() not in eolmodes:

2156

raise error.Abort(_('unsupported line endings type: %s') % eolmode)

2157

raise error.Abort(_('unsupported line endings type: %s') % eolmode)

2157

eolmode = eolmode.lower()

2158

eolmode = eolmode.lower()

2158

2159

store = filestore()

2160

store = filestore()

2160

try:

2161

try:

2161

fp = open(patchobj, 'rb')

2162

fp = open(patchobj, 'rb')

2162

except TypeError:

2163

except TypeError:

2163

fp = patchobj

2164

fp = patchobj

2164

try:

2165

try:

2165

ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,

2166

ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,

2166

eolmode=eolmode)

2167

eolmode=eolmode)

2167

finally:

2168

finally:

2168

if fp != patchobj:

2169

if fp != patchobj:

2169

fp.close()

2170

fp.close()

2170

files.update(backend.close())

2171

files.update(backend.close())

2171

store.close()

2172

store.close()

2172

if ret < 0:

2173

if ret < 0:

2173

raise PatchError(_('patch failed to apply'))

2174

raise PatchError(_('patch failed to apply'))

2174

return ret > 0

2175

return ret > 0

2175

2176

def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,

2177

def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,

2177

eolmode='strict', similarity=0):

2178

eolmode='strict', similarity=0):

2178

"""use builtin patch to apply <patchobj> to the working directory.

2179

"""use builtin patch to apply <patchobj> to the working directory.

2179

returns whether patch was applied with fuzz factor."""

2180

returns whether patch was applied with fuzz factor."""

2180

backend = workingbackend(ui, repo, similarity)

2181

backend = workingbackend(ui, repo, similarity)

2181

return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)

2182

return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)

2182

2183

def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,

2184

def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,

2184

eolmode='strict'):

2185

eolmode='strict'):

2185

backend = repobackend(ui, repo, ctx, store)

2186

backend = repobackend(ui, repo, ctx, store)

2186

return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)

2187

return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)

2187

2188

def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',

2189

def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',

2189

similarity=0):

2190

similarity=0):

2190

"""Apply <patchname> to the working directory.

2191

"""Apply <patchname> to the working directory.

2191

2192

'eolmode' specifies how end of lines should be handled. It can be:

2193

'eolmode' specifies how end of lines should be handled. It can be:

2193

- 'strict': inputs are read in binary mode, EOLs are preserved

2194

- 'strict': inputs are read in binary mode, EOLs are preserved

2194

- 'crlf': EOLs are ignored when patching and reset to CRLF

2195

- 'crlf': EOLs are ignored when patching and reset to CRLF

2195

- 'lf': EOLs are ignored when patching and reset to LF

2196

- 'lf': EOLs are ignored when patching and reset to LF

2196

- None: get it from user settings, default to 'strict'

2197

- None: get it from user settings, default to 'strict'

2197

'eolmode' is ignored when using an external patcher program.

2198

'eolmode' is ignored when using an external patcher program.

2198

2199

Returns whether patch was applied with fuzz factor.

2200

Returns whether patch was applied with fuzz factor.

2200

"""

2201

"""

2201

patcher = ui.config('ui', 'patch')

2202

patcher = ui.config('ui', 'patch')

2202

if files is None:

2203

if files is None:

2203

files = set()

2204

files = set()

2204

if patcher:

2205

if patcher:

2205

return _externalpatch(ui, repo, patcher, patchname, strip,

2206

return _externalpatch(ui, repo, patcher, patchname, strip,

2206

files, similarity)

2207

files, similarity)

2207

return internalpatch(ui, repo, patchname, strip, prefix, files, eolmode,

2208

return internalpatch(ui, repo, patchname, strip, prefix, files, eolmode,

2208

similarity)

2209

similarity)

2209

2210

def changedfiles(ui, repo, patchpath, strip=1, prefix=''):

2211

def changedfiles(ui, repo, patchpath, strip=1, prefix=''):

2211

backend = fsbackend(ui, repo.root)

2212

backend = fsbackend(ui, repo.root)

2212

prefix = _canonprefix(repo, prefix)

2213

prefix = _canonprefix(repo, prefix)

2213

with open(patchpath, 'rb') as fp:

2214

with open(patchpath, 'rb') as fp:

2214

changed = set()

2215

changed = set()

2215

for state, values in iterhunks(fp):

2216

for state, values in iterhunks(fp):

2216

if state == 'file':

2217

if state == 'file':

2217

afile, bfile, first_hunk, gp = values

2218

afile, bfile, first_hunk, gp = values

2218

if gp:

2219

if gp:

2219

gp.path = pathtransform(gp.path, strip - 1, prefix)[1]

2220

gp.path = pathtransform(gp.path, strip - 1, prefix)[1]

2220

if gp.oldpath:

2221

if gp.oldpath:

2221

gp.oldpath = pathtransform(gp.oldpath, strip - 1,

2222

gp.oldpath = pathtransform(gp.oldpath, strip - 1,

2222

prefix)[1]

2223

prefix)[1]

2223

else:

2224

else:

2224

gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,

2225

gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,

2225

prefix)

2226

prefix)

2226

changed.add(gp.path)

2227

changed.add(gp.path)

2227

if gp.op == 'RENAME':

2228

if gp.op == 'RENAME':

2228

changed.add(gp.oldpath)

2229

changed.add(gp.oldpath)

2229

elif state not in ('hunk', 'git'):

2230

elif state not in ('hunk', 'git'):

2230

raise error.Abort(_('unsupported parser state: %s') % state)

2231

raise error.Abort(_('unsupported parser state: %s') % state)

2231

return changed

2232

return changed

2232

2233

class GitDiffRequired(Exception):

2234

class GitDiffRequired(Exception):

2234

pass

2235

pass

2235

2236

diffopts = diffutil.diffallopts

2237

diffopts = diffutil.diffallopts

2237

diffallopts = diffutil.diffallopts

2238

diffallopts = diffutil.diffallopts

2238

difffeatureopts = diffutil.difffeatureopts

2239

difffeatureopts = diffutil.difffeatureopts

2239

2240

def diff(repo, node1=None, node2=None, match=None, changes=None,

2241

def diff(repo, node1=None, node2=None, match=None, changes=None,

2241

opts=None, losedatafn=None, pathfn=None, copy=None,

2242

opts=None, losedatafn=None, pathfn=None, copy=None,

2242

copysourcematch=None, hunksfilterfn=None):

2243

copysourcematch=None, hunksfilterfn=None):

2243

'''yields diff of changes to files between two nodes, or node and

2244

'''yields diff of changes to files between two nodes, or node and

2244

working directory.

2245

working directory.

2245

2246

if node1 is None, use first dirstate parent instead.

2247

if node1 is None, use first dirstate parent instead.

2247

if node2 is None, compare node1 with working directory.

2248

if node2 is None, compare node1 with working directory.

2248

2249

losedatafn(**kwarg) is a callable run when opts.upgrade=True and

2250

losedatafn(**kwarg) is a callable run when opts.upgrade=True and

2250

every time some change cannot be represented with the current

2251

every time some change cannot be represented with the current

2251

patch format. Return False to upgrade to git patch format, True to

2252

patch format. Return False to upgrade to git patch format, True to

2252

accept the loss or raise an exception to abort the diff. It is

2253

accept the loss or raise an exception to abort the diff. It is

2253

called with the name of current file being diffed as 'fn'. If set

2254

called with the name of current file being diffed as 'fn'. If set

2254

to None, patches will always be upgraded to git format when

2255

to None, patches will always be upgraded to git format when

2255

necessary.

2256

necessary.

2256

2257

prefix is a filename prefix that is prepended to all filenames on

2258

prefix is a filename prefix that is prepended to all filenames on

2258

display (used for subrepos).

2259

display (used for subrepos).

2259

2260

relroot, if not empty, must be normalized with a trailing /. Any match

2261

relroot, if not empty, must be normalized with a trailing /. Any match

2261

patterns that fall outside it will be ignored.

2262

patterns that fall outside it will be ignored.

2262

2263

copy, if not empty, should contain mappings {dst@y: src@x} of copy

2264

copy, if not empty, should contain mappings {dst@y: src@x} of copy

2264

information.

2265

information.

2265

2266

if copysourcematch is not None, then copy sources will be filtered by this

2267

if copysourcematch is not None, then copy sources will be filtered by this

2267

matcher

2268

matcher

2268

2269

hunksfilterfn, if not None, should be a function taking a filectx and

2270

hunksfilterfn, if not None, should be a function taking a filectx and

2270

hunks generator that may yield filtered hunks.

2271

hunks generator that may yield filtered hunks.

2271

'''

2272

'''

2272

if not node1 and not node2:

2273

if not node1 and not node2:

2273

node1 = repo.dirstate.p1()

2274

node1 = repo.dirstate.p1()

2274

2275

ctx1 = repo[node1]

2276

ctx1 = repo[node1]

2276

ctx2 = repo[node2]

2277

ctx2 = repo[node2]

2277

2278

for fctx1, fctx2, hdr, hunks in diffhunks(

2279

for fctx1, fctx2, hdr, hunks in diffhunks(

2279

repo, ctx1=ctx1, ctx2=ctx2, match=match, changes=changes, opts=opts,

2280

repo, ctx1=ctx1, ctx2=ctx2, match=match, changes=changes, opts=opts,

2280

losedatafn=losedatafn, pathfn=pathfn, copy=copy,

2281

losedatafn=losedatafn, pathfn=pathfn, copy=copy,

2281

copysourcematch=copysourcematch):

2282

copysourcematch=copysourcematch):

2282

if hunksfilterfn is not None:

2283

if hunksfilterfn is not None:

2283

# If the file has been removed, fctx2 is None; but this should

2284

# If the file has been removed, fctx2 is None; but this should

2284

# not occur here since we catch removed files early in

2285

# not occur here since we catch removed files early in

2285

# logcmdutil.getlinerangerevs() for 'hg log -L'.

2286

# logcmdutil.getlinerangerevs() for 'hg log -L'.

2286

assert fctx2 is not None, (

2287

assert fctx2 is not None, (

2287

'fctx2 unexpectly None in diff hunks filtering')

2288

'fctx2 unexpectly None in diff hunks filtering')

2288

hunks = hunksfilterfn(fctx2, hunks)

2289

hunks = hunksfilterfn(fctx2, hunks)

2289

text = ''.join(sum((list(hlines) for hrange, hlines in hunks), []))

2290

text = ''.join(sum((list(hlines) for hrange, hlines in hunks), []))

2290

if hdr and (text or len(hdr) > 1):

2291

if hdr and (text or len(hdr) > 1):

2291

yield '\n'.join(hdr) + '\n'

2292

yield '\n'.join(hdr) + '\n'

2292

if text:

2293

if text:

2293

yield text

2294

yield text

2294

2295

def diffhunks(repo, ctx1, ctx2, match=None, changes=None, opts=None,

2296

def diffhunks(repo, ctx1, ctx2, match=None, changes=None, opts=None,

2296

losedatafn=None, pathfn=None, copy=None, copysourcematch=None):

2297

losedatafn=None, pathfn=None, copy=None, copysourcematch=None):

2297

"""Yield diff of changes to files in the form of (`header`, `hunks`) tuples

2298

"""Yield diff of changes to files in the form of (`header`, `hunks`) tuples

2298

where `header` is a list of diff headers and `hunks` is an iterable of

2299

where `header` is a list of diff headers and `hunks` is an iterable of

2299

(`hunkrange`, `hunklines`) tuples.

2300

(`hunkrange`, `hunklines`) tuples.

2300

2301

See diff() for the meaning of parameters.

2302

See diff() for the meaning of parameters.

2302

"""

2303

"""

2303

2304

if opts is None:

2305

if opts is None:

2305

opts = mdiff.defaultopts

2306

opts = mdiff.defaultopts

2306

2307

def lrugetfilectx():

2308

def lrugetfilectx():

2308

cache = {}

2309

cache = {}

2309

order = collections.deque()

2310

order = collections.deque()

2310

def getfilectx(f, ctx):

2311

def getfilectx(f, ctx):

2311

fctx = ctx.filectx(f, filelog=cache.get(f))

2312

fctx = ctx.filectx(f, filelog=cache.get(f))

2312

if f not in cache:

2313

if f not in cache:

2313

if len(cache) > 20:

2314

if len(cache) > 20:

2314

del cache[order.popleft()]

2315

del cache[order.popleft()]

2315

cache[f] = fctx.filelog()

2316

cache[f] = fctx.filelog()

2316

else:

2317

else:

2317

order.remove(f)

2318

order.remove(f)

2318

order.append(f)

2319

order.append(f)

2319

return fctx

2320

return fctx

2320

return getfilectx

2321

return getfilectx

2321

getfilectx = lrugetfilectx()

2322

getfilectx = lrugetfilectx()

2322

2323

if not changes:

2324

if not changes:

2324

changes = ctx1.status(ctx2, match=match)

2325

changes = ctx1.status(ctx2, match=match)

2325

modified, added, removed = changes[:3]

2326

modified, added, removed = changes[:3]

2326

2327

if not modified and not added and not removed:

2328

if not modified and not added and not removed:

2328

return []

2329

return []

2329

2330

if repo.ui.debugflag:

2331

if repo.ui.debugflag:

2331

hexfunc = hex

2332

hexfunc = hex

2332

else:

2333

else:

2333

hexfunc = short

2334

hexfunc = short

2334

revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

2335

revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

2335

2336

if copy is None:

2337

if copy is None:

2337

copy = {}

2338

copy = {}

2338

if opts.git or opts.upgrade:

2339

if opts.git or opts.upgrade:

2339

copy = copies.pathcopies(ctx1, ctx2, match=match)

2340

copy = copies.pathcopies(ctx1, ctx2, match=match)

2340

2341

if copysourcematch:

2342

if copysourcematch:

2342

# filter out copies where source side isn't inside the matcher

2343

# filter out copies where source side isn't inside the matcher

2343

# (copies.pathcopies() already filtered out the destination)

2344

# (copies.pathcopies() already filtered out the destination)

2344

copy = {dst: src for dst, src in copy.iteritems()

2345

copy = {dst: src for dst, src in copy.iteritems()

2345

if copysourcematch(src)}

2346

if copysourcematch(src)}

2346

2347

modifiedset = set(modified)

2348

modifiedset = set(modified)

2348

addedset = set(added)

2349

addedset = set(added)

2349

removedset = set(removed)

2350

removedset = set(removed)

2350

for f in modified:

2351

for f in modified:

2351

if f not in ctx1:

2352

if f not in ctx1:

2352

# Fix up added, since merged-in additions appear as

2353

# Fix up added, since merged-in additions appear as

2353

# modifications during merges

2354

# modifications during merges

2354

modifiedset.remove(f)

2355

modifiedset.remove(f)

2355

addedset.add(f)

2356

addedset.add(f)

2356

for f in removed:

2357

for f in removed:

2357

if f not in ctx1:

2358

if f not in ctx1:

2358

# Merged-in additions that are then removed are reported as removed.

2359

# Merged-in additions that are then removed are reported as removed.

2359

# They are not in ctx1, so We don't want to show them in the diff.

2360

# They are not in ctx1, so We don't want to show them in the diff.

2360

removedset.remove(f)

2361

removedset.remove(f)

2361

modified = sorted(modifiedset)

2362

modified = sorted(modifiedset)

2362

added = sorted(addedset)

2363

added = sorted(addedset)

2363

removed = sorted(removedset)

2364

removed = sorted(removedset)

2364

for dst, src in list(copy.items()):

2365

for dst, src in list(copy.items()):

2365

if src not in ctx1:

2366

if src not in ctx1:

2366

# Files merged in during a merge and then copied/renamed are

2367

# Files merged in during a merge and then copied/renamed are

2367

# reported as copies. We want to show them in the diff as additions.

2368

# reported as copies. We want to show them in the diff as additions.

2368

del copy[dst]

2369

del copy[dst]

2369

2370

prefetchmatch = scmutil.matchfiles(

2371

prefetchmatch = scmutil.matchfiles(

2371

repo, list(modifiedset | addedset | removedset))

2372

repo, list(modifiedset | addedset | removedset))

2372

scmutil.prefetchfiles(repo, [ctx1.rev(), ctx2.rev()], prefetchmatch)

2373

scmutil.prefetchfiles(repo, [ctx1.rev(), ctx2.rev()], prefetchmatch)

2373

2374

def difffn(opts, losedata):

2375

def difffn(opts, losedata):

2375

return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,

2376

return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,

2376

copy, getfilectx, opts, losedata, pathfn)

2377

copy, getfilectx, opts, losedata, pathfn)

2377

if opts.upgrade and not opts.git:

2378

if opts.upgrade and not opts.git:

2378

try:

2379

try:

2379

def losedata(fn):

2380

def losedata(fn):

2380

if not losedatafn or not losedatafn(fn=fn):

2381

if not losedatafn or not losedatafn(fn=fn):

2381

raise GitDiffRequired

2382

raise GitDiffRequired

2382

# Buffer the whole output until we are sure it can be generated

2383

# Buffer the whole output until we are sure it can be generated

2383

return list(difffn(opts.copy(git=False), losedata))

2384

return list(difffn(opts.copy(git=False), losedata))

2384

except GitDiffRequired:

2385

except GitDiffRequired:

2385

return difffn(opts.copy(git=True), None)

2386

return difffn(opts.copy(git=True), None)

2386

else:

2387

else:

2387

return difffn(opts, None)

2388

return difffn(opts, None)

2388

2389

def diffsinglehunk(hunklines):

2390

def diffsinglehunk(hunklines):

2390

"""yield tokens for a list of lines in a single hunk"""

2391

"""yield tokens for a list of lines in a single hunk"""

2391

for line in hunklines:

2392

for line in hunklines:

2392

# chomp

2393

# chomp

2393

chompline = line.rstrip('\r\n')

2394

chompline = line.rstrip('\r\n')

2394

# highlight tabs and trailing whitespace

2395

# highlight tabs and trailing whitespace

2395

stripline = chompline.rstrip()

2396

stripline = chompline.rstrip()

2396

if line.startswith('-'):

2397

if line.startswith('-'):

2397

label = 'diff.deleted'

2398

label = 'diff.deleted'

2398

elif line.startswith('+'):

2399

elif line.startswith('+'):

2399

label = 'diff.inserted'

2400

label = 'diff.inserted'

2400

else:

2401

else:

2401

raise error.ProgrammingError('unexpected hunk line: %s' % line)

2402

raise error.ProgrammingError('unexpected hunk line: %s' % line)

2402

for token in tabsplitter.findall(stripline):

2403

for token in tabsplitter.findall(stripline):

2403

if token.startswith('\t'):

2404

if token.startswith('\t'):

2404

yield (token, 'diff.tab')

2405

yield (token, 'diff.tab')

2405

else:

2406

else:

2406

yield (token, label)

2407

yield (token, label)

2407

2408

if chompline != stripline:

2409

if chompline != stripline:

2409

yield (chompline[len(stripline):], 'diff.trailingwhitespace')

2410

yield (chompline[len(stripline):], 'diff.trailingwhitespace')

2410

if chompline != line:

2411

if chompline != line:

2411

yield (line[len(chompline):], '')

2412

yield (line[len(chompline):], '')

2412

2413

def diffsinglehunkinline(hunklines):

2414

def diffsinglehunkinline(hunklines):

2414

"""yield tokens for a list of lines in a single hunk, with inline colors"""

2415

"""yield tokens for a list of lines in a single hunk, with inline colors"""

2415

# prepare deleted, and inserted content

2416

# prepare deleted, and inserted content

2416

a = ''

2417

a = ''

2417

b = ''

2418

b = ''

2418

for line in hunklines:

2419

for line in hunklines:

2419

if line[0:1] == '-':

2420

if line[0:1] == '-':

2420

a += line[1:]

2421

a += line[1:]

2421

elif line[0:1] == '+':

2422

elif line[0:1] == '+':

2422

b += line[1:]

2423

b += line[1:]

2423

else:

2424

else:

2424

raise error.ProgrammingError('unexpected hunk line: %s' % line)

2425

raise error.ProgrammingError('unexpected hunk line: %s' % line)

2425

# fast path: if either side is empty, use diffsinglehunk

2426

# fast path: if either side is empty, use diffsinglehunk

2426

if not a or not b:

2427

if not a or not b:

2427

for t in diffsinglehunk(hunklines):

2428

for t in diffsinglehunk(hunklines):

2428

yield t

2429

yield t

2429

return

2430

return

2430

# re-split the content into words

2431

# re-split the content into words

2431

al = wordsplitter.findall(a)

2432

al = wordsplitter.findall(a)

2432

bl = wordsplitter.findall(b)

2433

bl = wordsplitter.findall(b)

2433

# re-arrange the words to lines since the diff algorithm is line-based

2434

# re-arrange the words to lines since the diff algorithm is line-based

2434

aln = [s if s == '\n' else s + '\n' for s in al]

2435

aln = [s if s == '\n' else s + '\n' for s in al]

2435

bln = [s if s == '\n' else s + '\n' for s in bl]

2436

bln = [s if s == '\n' else s + '\n' for s in bl]

2436

an = ''.join(aln)

2437

an = ''.join(aln)

2437

bn = ''.join(bln)

2438

bn = ''.join(bln)

2438

# run the diff algorithm, prepare atokens and btokens

2439

# run the diff algorithm, prepare atokens and btokens

2439

atokens = []

2440

atokens = []

2440

btokens = []

2441

btokens = []

2441

blocks = mdiff.allblocks(an, bn, lines1=aln, lines2=bln)

2442

blocks = mdiff.allblocks(an, bn, lines1=aln, lines2=bln)

2442

for (a1, a2, b1, b2), btype in blocks:

2443

for (a1, a2, b1, b2), btype in blocks:

2443

changed = btype == '!'

2444

changed = btype == '!'

2444

for token in mdiff.splitnewlines(''.join(al[a1:a2])):

2445

for token in mdiff.splitnewlines(''.join(al[a1:a2])):

2445

atokens.append((changed, token))

2446

atokens.append((changed, token))

2446

for token in mdiff.splitnewlines(''.join(bl[b1:b2])):

2447

for token in mdiff.splitnewlines(''.join(bl[b1:b2])):

2447

btokens.append((changed, token))

2448

btokens.append((changed, token))

2448

2449

# yield deleted tokens, then inserted ones

2450

# yield deleted tokens, then inserted ones

2450

for prefix, label, tokens in [('-', 'diff.deleted', atokens),

2451

for prefix, label, tokens in [('-', 'diff.deleted', atokens),

2451

('+', 'diff.inserted', btokens)]:

2452

('+', 'diff.inserted', btokens)]:

2452

nextisnewline = True

2453

nextisnewline = True

2453

for changed, token in tokens:

2454

for changed, token in tokens:

2454

if nextisnewline:

2455

if nextisnewline:

2455

yield (prefix, label)

2456

yield (prefix, label)

2456

nextisnewline = False

2457

nextisnewline = False

2457

# special handling line end

2458

# special handling line end

2458

isendofline = token.endswith('\n')

2459

isendofline = token.endswith('\n')

2459

if isendofline:

2460

if isendofline:

2460

chomp = token[:-1] # chomp

2461

chomp = token[:-1] # chomp

2461

if chomp.endswith('\r'):

2462

if chomp.endswith('\r'):

2462

chomp = chomp[:-1]

2463

chomp = chomp[:-1]

2463

endofline = token[len(chomp):]

2464

endofline = token[len(chomp):]

2464

token = chomp.rstrip() # detect spaces at the end

2465

token = chomp.rstrip() # detect spaces at the end

2465

endspaces = chomp[len(token):]

2466

endspaces = chomp[len(token):]

2466

# scan tabs

2467

# scan tabs

2467

for maybetab in tabsplitter.findall(token):

2468

for maybetab in tabsplitter.findall(token):

2468

if b'\t' == maybetab[0:1]:

2469

if b'\t' == maybetab[0:1]:

2469

currentlabel = 'diff.tab'

2470

currentlabel = 'diff.tab'

2470

else:

2471

else:

2471

if changed:

2472

if changed:

2472

currentlabel = label + '.changed'

2473

currentlabel = label + '.changed'

2473

else:

2474

else:

2474

currentlabel = label + '.unchanged'

2475

currentlabel = label + '.unchanged'

2475

yield (maybetab, currentlabel)

2476

yield (maybetab, currentlabel)

2476

if isendofline:

2477

if isendofline:

2477

if endspaces:

2478

if endspaces:

2478

yield (endspaces, 'diff.trailingwhitespace')

2479

yield (endspaces, 'diff.trailingwhitespace')

2479

yield (endofline, '')

2480

yield (endofline, '')

2480

nextisnewline = True

2481

nextisnewline = True

2481

2482

def difflabel(func, *args, **kw):

2483

def difflabel(func, *args, **kw):

2483

'''yields 2-tuples of (output, label) based on the output of func()'''

2484

'''yields 2-tuples of (output, label) based on the output of func()'''

2484

if kw.get(r'opts') and kw[r'opts'].worddiff:

2485

if kw.get(r'opts') and kw[r'opts'].worddiff:

2485

dodiffhunk = diffsinglehunkinline

2486

dodiffhunk = diffsinglehunkinline

2486

else:

2487

else:

2487

dodiffhunk = diffsinglehunk

2488

dodiffhunk = diffsinglehunk

2488

headprefixes = [('diff', 'diff.diffline'),

2489

headprefixes = [('diff', 'diff.diffline'),

2489

('copy', 'diff.extended'),

2490

('copy', 'diff.extended'),

2490

('rename', 'diff.extended'),

2491

('rename', 'diff.extended'),

2491

('old', 'diff.extended'),

2492

('old', 'diff.extended'),

2492

('new', 'diff.extended'),

2493

('new', 'diff.extended'),

2493

('deleted', 'diff.extended'),

2494

('deleted', 'diff.extended'),

2494

('index', 'diff.extended'),

2495

('index', 'diff.extended'),

2495

('similarity', 'diff.extended'),

2496

('similarity', 'diff.extended'),

2496

('---', 'diff.file_a'),

2497

('---', 'diff.file_a'),

2497

('+++', 'diff.file_b')]

2498

('+++', 'diff.file_b')]

2498

textprefixes = [('@', 'diff.hunk'),

2499

textprefixes = [('@', 'diff.hunk'),

2499

# - and + are handled by diffsinglehunk

2500

# - and + are handled by diffsinglehunk

2500

]

2501

]

2501

head = False

2502

head = False

2502

2503

# buffers a hunk, i.e. adjacent "-", "+" lines without other changes.

2504

# buffers a hunk, i.e. adjacent "-", "+" lines without other changes.

2504

hunkbuffer = []

2505

hunkbuffer = []

2505

def consumehunkbuffer():

2506

def consumehunkbuffer():

2506

if hunkbuffer:

2507

if hunkbuffer:

2507

for token in dodiffhunk(hunkbuffer):

2508

for token in dodiffhunk(hunkbuffer):

2508

yield token

2509

yield token

2509

hunkbuffer[:] = []

2510

hunkbuffer[:] = []

2510

2511

for chunk in func(*args, **kw):

2512

for chunk in func(*args, **kw):

2512

lines = chunk.split('\n')

2513

lines = chunk.split('\n')

2513

linecount = len(lines)

2514

linecount = len(lines)

2514

for i, line in enumerate(lines):

2515

for i, line in enumerate(lines):

2515

if head:

2516

if head:

2516

if line.startswith('@'):

2517

if line.startswith('@'):

2517

head = False

2518

head = False

2518

else:

2519

else:

2519

if line and not line.startswith((' ', '+', '-', '@', '\\')):

2520

if line and not line.startswith((' ', '+', '-', '@', '\\')):

2520

head = True

2521

head = True

2521

diffline = False

2522

diffline = False

2522

if not head and line and line.startswith(('+', '-')):

2523

if not head and line and line.startswith(('+', '-')):

2523

diffline = True

2524

diffline = True

2524

2525

prefixes = textprefixes

2526

prefixes = textprefixes

2526

if head:

2527

if head:

2527

prefixes = headprefixes

2528

prefixes = headprefixes

2528

if diffline:

2529

if diffline:

2529

# buffered

2530

# buffered

2530

bufferedline = line

2531

bufferedline = line

2531

if i + 1 < linecount:

2532

if i + 1 < linecount:

2532

bufferedline += "\n"

2533

bufferedline += "\n"

2533

hunkbuffer.append(bufferedline)

2534

hunkbuffer.append(bufferedline)

2534

else:

2535

else:

2535

# unbuffered

2536

# unbuffered

2536

for token in consumehunkbuffer():

2537

for token in consumehunkbuffer():

2537

yield token

2538

yield token

2538

stripline = line.rstrip()

2539

stripline = line.rstrip()

2539

for prefix, label in prefixes:

2540

for prefix, label in prefixes:

2540

if stripline.startswith(prefix):

2541

if stripline.startswith(prefix):

2541

yield (stripline, label)

2542

yield (stripline, label)

2542

if line != stripline:

2543

if line != stripline:

2543

yield (line[len(stripline):],

2544

yield (line[len(stripline):],

2544

'diff.trailingwhitespace')

2545

'diff.trailingwhitespace')

2545

break

2546

break

2546

else:

2547

else:

2547

yield (line, '')

2548

yield (line, '')

2548

if i + 1 < linecount:

2549

if i + 1 < linecount:

2549

yield ('\n', '')

2550

yield ('\n', '')

2550

for token in consumehunkbuffer():

2551

for token in consumehunkbuffer():

2551

yield token

2552

yield token

2552

2553

def diffui(*args, **kw):

2554

def diffui(*args, **kw):

2554

'''like diff(), but yields 2-tuples of (output, label) for ui.write()'''

2555

'''like diff(), but yields 2-tuples of (output, label) for ui.write()'''

2555

return difflabel(diff, *args, **kw)

2556

return difflabel(diff, *args, **kw)

2556

2557

def _filepairs(modified, added, removed, copy, opts):

2558

def _filepairs(modified, added, removed, copy, opts):

2558

'''generates tuples (f1, f2, copyop), where f1 is the name of the file

2559

'''generates tuples (f1, f2, copyop), where f1 is the name of the file

2559

before and f2 is the the name after. For added files, f1 will be None,

2560

before and f2 is the the name after. For added files, f1 will be None,

2560

and for removed files, f2 will be None. copyop may be set to None, 'copy'

2561

and for removed files, f2 will be None. copyop may be set to None, 'copy'

2561

or 'rename' (the latter two only if opts.git is set).'''

2562

or 'rename' (the latter two only if opts.git is set).'''

2562

gone = set()

2563

gone = set()

2563

2564

copyto = dict([(v, k) for k, v in copy.items()])

2565

copyto = dict([(v, k) for k, v in copy.items()])

2565

2566

addedset, removedset = set(added), set(removed)

2567

addedset, removedset = set(added), set(removed)

2567

2568

for f in sorted(modified + added + removed):

2569

for f in sorted(modified + added + removed):

2569

copyop = None

2570

copyop = None

2570

f1, f2 = f, f

2571

f1, f2 = f, f

2571

if f in addedset:

2572

if f in addedset:

2572

f1 = None

2573

f1 = None

2573

if f in copy:

2574

if f in copy:

2574

if opts.git:

2575

if opts.git:

2575

f1 = copy[f]

2576

f1 = copy[f]

2576

if f1 in removedset and f1 not in gone:

2577

if f1 in removedset and f1 not in gone:

2577

copyop = 'rename'

2578

copyop = 'rename'

2578

gone.add(f1)

2579

gone.add(f1)

2579

else:

2580

else:

2580

copyop = 'copy'

2581

copyop = 'copy'

2581

elif f in removedset:

2582

elif f in removedset:

2582

f2 = None

2583

f2 = None

2583

if opts.git:

2584

if opts.git:

2584

# have we already reported a copy above?

2585

# have we already reported a copy above?

2585

if (f in copyto and copyto[f] in addedset

2586

if (f in copyto and copyto[f] in addedset

2586

and copy[copyto[f]] == f):

2587

and copy[copyto[f]] == f):

2587

continue

2588

continue

2588

yield f1, f2, copyop

2589

yield f1, f2, copyop

2589

2590

def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,

2591

def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,

2591

copy, getfilectx, opts, losedatafn, pathfn):

2592

copy, getfilectx, opts, losedatafn, pathfn):

2592

'''given input data, generate a diff and yield it in blocks

2593

'''given input data, generate a diff and yield it in blocks

2593

2594

If generating a diff would lose data like flags or binary data and

2595

If generating a diff would lose data like flags or binary data and

2595

losedatafn is not None, it will be called.

2596

losedatafn is not None, it will be called.

2596

2597

pathfn is applied to every path in the diff output.

2598

pathfn is applied to every path in the diff output.

2598

'''

2599

'''

2599

2600

def gitindex(text):

2601

def gitindex(text):

2601

if not text:

2602

if not text:

2602

text = ""

2603

text = ""

2603

l = len(text)

2604

l = len(text)

2604

s = hashlib.sha1('blob %d\0' % l)

2605

s = hashlib.sha1('blob %d\0' % l)

2605

s.update(text)

2606

s.update(text)

2606

return hex(s.digest())

2607

return hex(s.digest())

2607

2608

if opts.noprefix:

2609

if opts.noprefix:

2609

aprefix = bprefix = ''

2610

aprefix = bprefix = ''

2610

else:

2611

else:

2611

aprefix = 'a/'

2612

aprefix = 'a/'

2612

bprefix = 'b/'

2613

bprefix = 'b/'

2613

2614

def diffline(f, revs):

2615

def diffline(f, revs):

2615

revinfo = ' '.join(["-r %s" % rev for rev in revs])

2616

revinfo = ' '.join(["-r %s" % rev for rev in revs])

2616

return 'diff %s %s' % (revinfo, f)

2617

return 'diff %s %s' % (revinfo, f)

2617

2618

def isempty(fctx):

2619

def isempty(fctx):

2619

return fctx is None or fctx.size() == 0

2620

return fctx is None or fctx.size() == 0

2620

2621

date1 = dateutil.datestr(ctx1.date())

2622

date1 = dateutil.datestr(ctx1.date())

2622

date2 = dateutil.datestr(ctx2.date())

2623

date2 = dateutil.datestr(ctx2.date())

2623

2624

gitmode = {'l': '120000', 'x': '100755', '': '100644'}

2625

gitmode = {'l': '120000', 'x': '100755', '': '100644'}

2625

2626

if not pathfn:

2627

if not pathfn:

2627

pathfn = lambda f: f

2628

pathfn = lambda f: f

2628

2629

for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):

2630

for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):

2630

content1 = None

2631

content1 = None

2631

content2 = None

2632

content2 = None

2632

fctx1 = None

2633

fctx1 = None

2633

fctx2 = None

2634

fctx2 = None

2634

flag1 = None

2635

flag1 = None

2635

flag2 = None

2636

flag2 = None

2636

if f1:

2637

if f1:

2637

fctx1 = getfilectx(f1, ctx1)

2638

fctx1 = getfilectx(f1, ctx1)

2638

if opts.git or losedatafn:

2639

if opts.git or losedatafn:

2639

flag1 = ctx1.flags(f1)

2640

flag1 = ctx1.flags(f1)

2640

if f2:

2641

if f2:

2641

fctx2 = getfilectx(f2, ctx2)

2642

fctx2 = getfilectx(f2, ctx2)

2642

if opts.git or losedatafn:

2643

if opts.git or losedatafn:

2643

flag2 = ctx2.flags(f2)

2644

flag2 = ctx2.flags(f2)

2644

# if binary is True, output "summary" or "base85", but not "text diff"

2645

# if binary is True, output "summary" or "base85", but not "text diff"

2645

if opts.text:

2646

if opts.text:

2646

binary = False

2647

binary = False

2647

else:

2648

else:

2648

binary = any(f.isbinary() for f in [fctx1, fctx2] if f is not None)

2649

binary = any(f.isbinary() for f in [fctx1, fctx2] if f is not None)

2649

2650

if losedatafn and not opts.git:

2651

if losedatafn and not opts.git:

2651

if (binary or

2652

if (binary or

2652

# copy/rename

2653

# copy/rename

2653

f2 in copy or

2654

f2 in copy or

2654

# empty file creation

2655

# empty file creation

2655

(not f1 and isempty(fctx2)) or

2656

(not f1 and isempty(fctx2)) or

2656

# empty file deletion

2657

# empty file deletion

2657

(isempty(fctx1) and not f2) or

2658

(isempty(fctx1) and not f2) or

2658

# create with flags

2659

# create with flags

2659

(not f1 and flag2) or

2660

(not f1 and flag2) or

2660

# change flags

2661

# change flags

2661

(f1 and f2 and flag1 != flag2)):

2662

(f1 and f2 and flag1 != flag2)):

2662

losedatafn(f2 or f1)

2663

losedatafn(f2 or f1)

2663

2664

path1 = pathfn(f1 or f2)

2665

path1 = pathfn(f1 or f2)

2665

path2 = pathfn(f2 or f1)

2666

path2 = pathfn(f2 or f1)

2666

header = []

2667

header = []

2667

if opts.git:

2668

if opts.git:

2668

header.append('diff --git %s%s %s%s' %

2669

header.append('diff --git %s%s %s%s' %

2669

(aprefix, path1, bprefix, path2))

2670

(aprefix, path1, bprefix, path2))

2670

if not f1: # added

2671

if not f1: # added

2671

header.append('new file mode %s' % gitmode[flag2])

2672

header.append('new file mode %s' % gitmode[flag2])

2672

elif not f2: # removed

2673

elif not f2: # removed

2673

header.append('deleted file mode %s' % gitmode[flag1])

2674

header.append('deleted file mode %s' % gitmode[flag1])

2674

else: # modified/copied/renamed

2675

else: # modified/copied/renamed

2675

mode1, mode2 = gitmode[flag1], gitmode[flag2]

2676

mode1, mode2 = gitmode[flag1], gitmode[flag2]

2676

if mode1 != mode2:

2677

if mode1 != mode2:

2677

header.append('old mode %s' % mode1)

2678

header.append('old mode %s' % mode1)

2678

header.append('new mode %s' % mode2)

2679

header.append('new mode %s' % mode2)

2679

if copyop is not None:

2680

if copyop is not None:

2680

if opts.showsimilarity:

2681

if opts.showsimilarity:

2681

sim = similar.score(ctx1[path1], ctx2[path2]) * 100

2682

sim = similar.score(ctx1[path1], ctx2[path2]) * 100

2682

header.append('similarity index %d%%' % sim)

2683

header.append('similarity index %d%%' % sim)

2683

header.append('%s from %s' % (copyop, path1))

2684

header.append('%s from %s' % (copyop, path1))

2684

header.append('%s to %s' % (copyop, path2))

2685

header.append('%s to %s' % (copyop, path2))

2685

elif revs:

2686

elif revs:

2686

header.append(diffline(path1, revs))

2687

header.append(diffline(path1, revs))

2687

2688

# fctx.is | diffopts | what to | is fctx.data()

2689

# fctx.is | diffopts | what to | is fctx.data()

2689

# binary() | text nobinary git index | output? | outputted?

2690

# binary() | text nobinary git index | output? | outputted?

2690

# ------------------------------------|----------------------------

2691

# ------------------------------------|----------------------------

2691

# yes | no no no * | summary | no

2692

# yes | no no no * | summary | no

2692

# yes | no no yes * | base85 | yes

2693

# yes | no no yes * | base85 | yes

2693

# yes | no yes no * | summary | no

2694

# yes | no yes no * | summary | no

2694

# yes | no yes yes 0 | summary | no

2695

# yes | no yes yes 0 | summary | no

2695

# yes | no yes yes >0 | summary | semi [1]

2696

# yes | no yes yes >0 | summary | semi [1]

2696

# yes | yes * * * | text diff | yes

2697

# yes | yes * * * | text diff | yes

2697

# no | * * * * | text diff | yes

2698

# no | * * * * | text diff | yes

2698

# [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked

2699

# [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked

2699

if binary and (not opts.git or (opts.git and opts.nobinary and not

2700

if binary and (not opts.git or (opts.git and opts.nobinary and not

2700

opts.index)):

2701

opts.index)):

2701

# fast path: no binary content will be displayed, content1 and

2702

# fast path: no binary content will be displayed, content1 and

2702

# content2 are only used for equivalent test. cmp() could have a

2703

# content2 are only used for equivalent test. cmp() could have a

2703

# fast path.

2704

# fast path.

2704

if fctx1 is not None:

2705

if fctx1 is not None:

2705

content1 = b'\0'

2706

content1 = b'\0'

2706

if fctx2 is not None:

2707

if fctx2 is not None:

2707

if fctx1 is not None and not fctx1.cmp(fctx2):

2708

if fctx1 is not None and not fctx1.cmp(fctx2):

2708

content2 = b'\0' # not different

2709

content2 = b'\0' # not different

2709

else:

2710

else:

2710

content2 = b'\0\0'

2711

content2 = b'\0\0'

2711

else:

2712

else:

2712

# normal path: load contents

2713

# normal path: load contents

2713

if fctx1 is not None:

2714

if fctx1 is not None:

2714

content1 = fctx1.data()

2715

content1 = fctx1.data()

2715

if fctx2 is not None:

2716

if fctx2 is not None:

2716

content2 = fctx2.data()

2717

content2 = fctx2.data()

2717

2718

if binary and opts.git and not opts.nobinary:

2719

if binary and opts.git and not opts.nobinary:

2719

text = mdiff.b85diff(content1, content2)

2720

text = mdiff.b85diff(content1, content2)

2720

if text:

2721

if text:

2721

header.append('index %s..%s' %

2722

header.append('index %s..%s' %

2722

(gitindex(content1), gitindex(content2)))

2723

(gitindex(content1), gitindex(content2)))

2723

hunks = (None, [text]),

2724

hunks = (None, [text]),

2724

else:

2725

else:

2725

if opts.git and opts.index > 0:

2726

if opts.git and opts.index > 0:

2726

flag = flag1

2727

flag = flag1

2727

if flag is None:

2728

if flag is None:

2728

flag = flag2

2729

flag = flag2

2729

header.append('index %s..%s %s' %

2730

header.append('index %s..%s %s' %

2730

(gitindex(content1)[0:opts.index],

2731

(gitindex(content1)[0:opts.index],

2731

gitindex(content2)[0:opts.index],

2732

gitindex(content2)[0:opts.index],

2732

gitmode[flag]))

2733

gitmode[flag]))

2733

2734

uheaders, hunks = mdiff.unidiff(content1, date1,

2735

uheaders, hunks = mdiff.unidiff(content1, date1,

2735

content2, date2,

2736

content2, date2,

2736

path1, path2,

2737

path1, path2,

2737

binary=binary, opts=opts)

2738

binary=binary, opts=opts)

2738

header.extend(uheaders)

2739

header.extend(uheaders)

2739

yield fctx1, fctx2, header, hunks

2740

yield fctx1, fctx2, header, hunks

2740

2741

def diffstatsum(stats):

2742

def diffstatsum(stats):

2742

maxfile, maxtotal, addtotal, removetotal, binary = 0, 0, 0, 0, False

2743

maxfile, maxtotal, addtotal, removetotal, binary = 0, 0, 0, 0, False

2743

for f, a, r, b in stats:

2744

for f, a, r, b in stats:

2744

maxfile = max(maxfile, encoding.colwidth(f))

2745

maxfile = max(maxfile, encoding.colwidth(f))

2745

maxtotal = max(maxtotal, a + r)

2746

maxtotal = max(maxtotal, a + r)

2746

addtotal += a

2747

addtotal += a

2747

removetotal += r

2748

removetotal += r

2748

binary = binary or b

2749

binary = binary or b

2749

2750

return maxfile, maxtotal, addtotal, removetotal, binary

2751

return maxfile, maxtotal, addtotal, removetotal, binary

2751

2752

def diffstatdata(lines):

2753

def diffstatdata(lines):

2753

diffre = re.compile(br'^diff .*-r [a-z0-9]+\s(.*)$')

2754

diffre = re.compile(br'^diff .*-r [a-z0-9]+\s(.*)$')

2754

2755

results = []

2756

results = []

2756

filename, adds, removes, isbinary = None, 0, 0, False

2757

filename, adds, removes, isbinary = None, 0, 0, False

2757

2758

def addresult():

2759

def addresult():

2759

if filename:

2760

if filename:

2760

results.append((filename, adds, removes, isbinary))

2761

results.append((filename, adds, removes, isbinary))

2761

2762

# inheader is used to track if a line is in the

2763

# inheader is used to track if a line is in the

2763

# header portion of the diff. This helps properly account

2764

# header portion of the diff. This helps properly account

2764

# for lines that start with '--' or '++'

2765

# for lines that start with '--' or '++'

2765

inheader = False

2766

inheader = False

2766

2767

for line in lines:

2768

for line in lines:

2768

if line.startswith('diff'):

2769

if line.startswith('diff'):

2769

addresult()

2770

addresult()

2770

# starting a new file diff

2771

# starting a new file diff

2771

# set numbers to 0 and reset inheader

2772

# set numbers to 0 and reset inheader

2772

inheader = True

2773

inheader = True

2773

adds, removes, isbinary = 0, 0, False

2774

adds, removes, isbinary = 0, 0, False

2774

if line.startswith('diff --git a/'):

2775

if line.startswith('diff --git a/'):

2775

filename = gitre.search(line).group(2)

2776

filename = gitre.search(line).group(2)

2776

elif line.startswith('diff -r'):

2777

elif line.startswith('diff -r'):

2777

# format: "diff -r ... -r ... filename"

2778

# format: "diff -r ... -r ... filename"

2778

filename = diffre.search(line).group(1)

2779

filename = diffre.search(line).group(1)

2779

elif line.startswith('@@'):

2780

elif line.startswith('@@'):

2780

inheader = False

2781

inheader = False

2781

elif line.startswith('+') and not inheader:

2782

elif line.startswith('+') and not inheader:

2782

adds += 1

2783

adds += 1

2783

elif line.startswith('-') and not inheader:

2784

elif line.startswith('-') and not inheader:

2784

removes += 1

2785

removes += 1

2785

elif (line.startswith('GIT binary patch') or

2786

elif (line.startswith('GIT binary patch') or

2786

line.startswith('Binary file')):

2787

line.startswith('Binary file')):

2787

isbinary = True

2788

isbinary = True

2788

elif line.startswith('rename from'):

2789

elif line.startswith('rename from'):

2789

filename = line[12:]

2790

filename = line[12:]

2790

elif line.startswith('rename to'):

2791

elif line.startswith('rename to'):

2791

filename += ' => %s' % line[10:]

2792

filename += ' => %s' % line[10:]

2792

addresult()

2793

addresult()

2793

return results

2794

return results

2794

2795

def diffstat(lines, width=80):

2796

def diffstat(lines, width=80):

2796

output = []

2797

output = []

2797

stats = diffstatdata(lines)

2798

stats = diffstatdata(lines)

2798

maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

2799

maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

2799

2800

countwidth = len(str(maxtotal))

2801

countwidth = len(str(maxtotal))

2801

if hasbinary and countwidth < 3:

2802

if hasbinary and countwidth < 3:

2802

countwidth = 3

2803

countwidth = 3

2803

graphwidth = width - countwidth - maxname - 6

2804

graphwidth = width - countwidth - maxname - 6

2804

if graphwidth < 10:

2805

if graphwidth < 10:

2805

graphwidth = 10

2806

graphwidth = 10

2806

2807

def scale(i):

2808

def scale(i):

2808

if maxtotal <= graphwidth:

2809

if maxtotal <= graphwidth:

2809

return i

2810

return i

2810

# If diffstat runs out of room it doesn't print anything,

2811

# If diffstat runs out of room it doesn't print anything,

2811

# which isn't very useful, so always print at least one + or -

2812

# which isn't very useful, so always print at least one + or -

2812

# if there were at least some changes.

2813

# if there were at least some changes.

2813

return max(i * graphwidth // maxtotal, int(bool(i)))

2814

return max(i * graphwidth // maxtotal, int(bool(i)))

2814

2815

for filename, adds, removes, isbinary in stats:

2816

for filename, adds, removes, isbinary in stats:

2816

if isbinary:

2817

if isbinary:

2817

count = 'Bin'

2818

count = 'Bin'

2818

else:

2819

else:

2819

count = '%d' % (adds + removes)

2820

count = '%d' % (adds + removes)

2820

pluses = '+' * scale(adds)

2821

pluses = '+' * scale(adds)

2821

minuses = '-' * scale(removes)

2822

minuses = '-' * scale(removes)

2822

output.append(' %s%s | %*s %s%s\n' %

2823

output.append(' %s%s | %*s %s%s\n' %

2823

(filename, ' ' * (maxname - encoding.colwidth(filename)),

2824

(filename, ' ' * (maxname - encoding.colwidth(filename)),

2824

countwidth, count, pluses, minuses))

2825

countwidth, count, pluses, minuses))

2825

2826

if stats:

2827

if stats:

2827

output.append(_(' %d files changed, %d insertions(+), '

2828

output.append(_(' %d files changed, %d insertions(+), '

2828

'%d deletions(-)\n')

2829

'%d deletions(-)\n')

2829

% (len(stats), totaladds, totalremoves))

2830

% (len(stats), totaladds, totalremoves))

2830

2831

return ''.join(output)

2832

return ''.join(output)

2832

2833

def diffstatui(*args, **kw):

2834

def diffstatui(*args, **kw):

2834

'''like diffstat(), but yields 2-tuples of (output, label) for

2835

'''like diffstat(), but yields 2-tuples of (output, label) for

2835

ui.write()

2836

ui.write()

2836

'''

2837

'''

2837

2838

for line in diffstat(*args, **kw).splitlines():

2839

for line in diffstat(*args, **kw).splitlines():

2839

if line and line[-1] in '+-':

2840

if line and line[-1] in '+-':

2840

name, graph = line.rsplit(' ', 1)

2841

name, graph = line.rsplit(' ', 1)

2841

yield (name + ' ', '')

2842

yield (name + ' ', '')

2842

m = re.search(br'\++', graph)

2843

m = re.search(br'\++', graph)

2843

if m:

2844

if m:

2844

yield (m.group(0), 'diffstat.inserted')

2845

yield (m.group(0), 'diffstat.inserted')

2845

m = re.search(br'-+', graph)

2846

m = re.search(br'-+', graph)

2846

if m:

2847

if m:

2847

yield (m.group(0), 'diffstat.deleted')

2848

yield (m.group(0), 'diffstat.deleted')

2848

else:

2849

else:

2849

yield (line, '')

2850

yield (line, '')

2850

yield ('\n', '')

2851

yield ('\n', '')

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # patch.py - patch file parsing routines
             #
             # Copyright 2006 Brendan Cully <brendan@kublai.com>
             # Copyright 2007 Chris Mason <chris.mason@oracle.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import, print_function
             import collections
             import contextlib
             import copy
             import email
             import errno
             import hashlib
             import os
             import re
             import shutil
             import zlib
             from .i18n import _
             from .node import (
                 hex,
                 short,
             )
             from . import (
                 copies,
                 diffhelper,
                 diffutil,
                 encoding,
                 error,
                 mail,
                 mdiff,
                 pathutil,
                 pycompat,
                 scmutil,
                 similar,
                 util,
                 vfs as vfsmod,
             )
             from .utils import (
                 dateutil,
                 procutil,
                 stringutil,
             )
             stringio = util.stringio
             gitre = re.compile(br'diff --git a/(.*) b/(.*)')
             tabsplitter = re.compile(br'(\t+|[^\t]+)')
             wordsplitter = re.compile(br'(\t+| +|[a-zA-Z0-9_\x80-\xff]+|'
                                       b'[^ \ta-zA-Z0-9_\x80-\xff])')
             PatchError = error.PatchError
             # public functions
             def split(stream):
                 '''return an iterator of individual patches from a stream'''
                 def isheader(line, inheader):
                     if inheader and line.startswith((' ', '\t')):
                         # continuation
                         return True
                     if line.startswith((' ', '-', '+')):
                         # diff line - don't check for header pattern in there
                         return False
                     l = line.split(': ', 1)
                     return len(l) == 2 and ' ' not in l[0]
                 def chunk(lines):
                     return stringio(''.join(lines))
                 def hgsplit(stream, cur):
                     inheader = True
                     for line in stream:
                         if not line.strip():
                             inheader = False
                         if not inheader and line.startswith('# HG changeset patch'):
                             yield chunk(cur)
                             cur = []
                             inheader = True
                         cur.append(line)
                     if cur:
                         yield chunk(cur)
                 def mboxsplit(stream, cur):
                     for line in stream:
                         if line.startswith('From '):
                             for c in split(chunk(cur[1:])):
                                 yield c
                             cur = []
                         cur.append(line)
                     if cur:
                         for c in split(chunk(cur[1:])):
                             yield c
                 def mimesplit(stream, cur):
                     def msgfp(m):
                         fp = stringio()
                         g = email.Generator.Generator(fp, mangle_from_=False)
                         g.flatten(m)
                         fp.seek(0)
                         return fp
                     for line in stream:
                         cur.append(line)
                     c = chunk(cur)
                     m = mail.parse(c)
                     if not m.is_multipart():
                         yield msgfp(m)
                     else:
                         ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
                         for part in m.walk():
                             ct = part.get_content_type()
                             if ct not in ok_types:
                                 continue
                             yield msgfp(part)
                 def headersplit(stream, cur):
                     inheader = False
                     for line in stream:
                         if not inheader and isheader(line, inheader):
                             yield chunk(cur)
                             cur = []
                             inheader = True
                         if inheader and not isheader(line, inheader):
                             inheader = False
                         cur.append(line)
                     if cur:
                         yield chunk(cur)
                 def remainder(cur):
                     yield chunk(cur)
                 class fiter(object):
                     def __init__(self, fp):
                         self.fp = fp
                     def __iter__(self):
                         return self
                     def next(self):
                         l = self.fp.readline()
                         if not l:
                             raise StopIteration
                         return l
                     __next__ = next
                 inheader = False
                 cur = []
                 mimeheaders = ['content-type']
                 if not util.safehasattr(stream, 'next'):
                     # http responses, for example, have readline but not next
                     stream = fiter(stream)
                 for line in stream:
                     cur.append(line)
                     if line.startswith('# HG changeset patch'):
                         return hgsplit(stream, cur)
                     elif line.startswith('From '):
                         return mboxsplit(stream, cur)
                     elif isheader(line, inheader):
                         inheader = True
                         if line.split(':', 1)[0].lower() in mimeheaders:
                             # let email parser handle this
                             return mimesplit(stream, cur)
                     elif line.startswith('--- ') and inheader:
                         # No evil headers seen by diff start, split by hand
                         return headersplit(stream, cur)
                     # Not enough info, keep reading
                 # if we are here, we have a very plain patch
                 return remainder(cur)
             ## Some facility for extensible patch parsing:
             # list of pairs ("header to match", "data key")
             patchheadermap = [('Date', 'date'),
                               ('Branch', 'branch'),
                               ('Node ID', 'nodeid'),
                              ]
             @contextlib.contextmanager
             def extract(ui, fileobj):
                 '''extract patch from data read from fileobj.
                 patch can be a normal patch or contained in an email message.
                 return a dictionary. Standard keys are:
                   - filename,
                   - message,
                   - user,
                   - date,
                   - branch,
                   - node,
                   - p1,
                   - p2.
                 Any item can be missing from the dictionary. If filename is missing,
                 fileobj did not contain a patch. Caller must unlink filename when done.'''
                 fd, tmpname = pycompat.mkstemp(prefix='hg-patch-')
                 tmpfp = os.fdopen(fd, r'wb')
                 try:
                     yield _extract(ui, fileobj, tmpname, tmpfp)
                 finally:
                     tmpfp.close()
                     os.unlink(tmpname)
             def _extract(ui, fileobj, tmpname, tmpfp):
                 # attempt to detect the start of a patch
                 # (this heuristic is borrowed from quilt)
                 diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'
                                     br'retrieving revision [0-9]+(\.[0-9]+)*$|'
                                     br'---[ \t].*?^\+\+\+[ \t]|'
                                     br'\*\*\*[ \t].*?^---[ \t])',
                                     re.MULTILINE | re.DOTALL)
                 data = {}
                 msg = mail.parse(fileobj)
                 subject = msg[r'Subject'] and mail.headdecode(msg[r'Subject'])
                 data['user'] = msg[r'From'] and mail.headdecode(msg[r'From'])
                 if not subject and not data['user']:
                     # Not an email, restore parsed headers if any
                     subject = '\n'.join(': '.join(map(encoding.strtolocal, h))
                                         for h in msg.items()) + '\n'
                 # should try to parse msg['Date']
                 parents = []
                 if subject:
                     if subject.startswith('[PATCH'):
                         pend = subject.find(']')
                         if pend >= 0:
                             subject = subject[pend + 1:].lstrip()
                     subject = re.sub(br'\n[ \t]+', ' ', subject)
                     ui.debug('Subject: %s\n' % subject)
                 if data['user']:
                     ui.debug('From: %s\n' % data['user'])
                 diffs_seen = 0
                 ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
                 message = ''
                 for part in msg.walk():
                     content_type = pycompat.bytestr(part.get_content_type())
                     ui.debug('Content-Type: %s\n' % content_type)
                     if content_type not in ok_types:
                         continue
                     payload = part.get_payload(decode=True)
                     m = diffre.search(payload)
                     if m:
                         hgpatch = False
                         hgpatchheader = False
                         ignoretext = False
                         ui.debug('found patch at byte %d\n' % m.start(0))
                         diffs_seen += 1
                         cfp = stringio()
                         for line in payload[:m.start(0)].splitlines():
                             if line.startswith('# HG changeset patch') and not hgpatch:
                                 ui.debug('patch generated by hg export\n')
                                 hgpatch = True
                                 hgpatchheader = True
                                 # drop earlier commit message content
                                 cfp.seek(0)
                                 cfp.truncate()
                                 subject = None
                             elif hgpatchheader:
                                 if line.startswith('# User '):
                                     data['user'] = line[7:]
                                     ui.debug('From: %s\n' % data['user'])
                                 elif line.startswith("# Parent "):
                                     parents.append(line[9:].lstrip())
                                 elif line.startswith("# "):
                                     for header, key in patchheadermap:
                                         prefix = '# %s ' % header
                                         if line.startswith(prefix):
                                             data[key] = line[len(prefix):]
                                 else:
                                     hgpatchheader = False
                             elif line == '---':
                                 ignoretext = True
                             if not hgpatchheader and not ignoretext:
                                 cfp.write(line)
                                 cfp.write('\n')
                         message = cfp.getvalue()
                         if tmpfp:
                             tmpfp.write(payload)
                             if not payload.endswith('\n'):
                                 tmpfp.write('\n')
                     elif not diffs_seen and message and content_type == 'text/plain':
                         message += '\n' + payload
                 if subject and not message.startswith(subject):
                     message = '%s\n%s' % (subject, message)
                 data['message'] = message
                 tmpfp.close()
                 if parents:
                     data['p1'] = parents.pop(0)
                     if parents:
                         data['p2'] = parents.pop(0)
                 if diffs_seen:
                     data['filename'] = tmpname
                 return data
             class patchmeta(object):
                 """Patched file metadata
                 'op' is the performed operation within ADD, DELETE, RENAME, MODIFY
                 or COPY.  'path' is patched file path. 'oldpath' is set to the
                 origin file when 'op' is either COPY or RENAME, None otherwise. If
                 file mode is changed, 'mode' is a tuple (islink, isexec) where
                 'islink' is True if the file is a symlink and 'isexec' is True if
                 the file is executable. Otherwise, 'mode' is None.
                 """
                 def __init__(self, path):
                     self.path = path
                     self.oldpath = None
                     self.mode = None
                     self.op = 'MODIFY'
                     self.binary = False
                 def setmode(self, mode):
                     islink = mode & 0o20000
                     isexec = mode & 0o100
                     self.mode = (islink, isexec)
                 def copy(self):
                     other = patchmeta(self.path)
                     other.oldpath = self.oldpath
                     other.mode = self.mode
                     other.op = self.op
                     other.binary = self.binary
                     return other
                 def _ispatchinga(self, afile):
                     if afile == '/dev/null':
                         return self.op == 'ADD'
                     return afile == 'a/' + (self.oldpath or self.path)
                 def _ispatchingb(self, bfile):
                     if bfile == '/dev/null':
                         return self.op == 'DELETE'
                     return bfile == 'b/' + self.path
                 def ispatching(self, afile, bfile):
                     return self._ispatchinga(afile) and self._ispatchingb(bfile)
                 def __repr__(self):
                     return r"<patchmeta %s %r>" % (self.op, self.path)
             def readgitpatch(lr):
                 """extract git-style metadata about patches from <patchname>"""
                 # Filter patch for git information
                 gp = None
                 gitpatches = []
                 for line in lr:
                     line = line.rstrip(' \r\n')
                     if line.startswith('diff --git a/'):
                         m = gitre.match(line)
                         if m:
                             if gp:
                                 gitpatches.append(gp)
                             dst = m.group(2)
                             gp = patchmeta(dst)
                     elif gp:
                         if line.startswith('--- '):
                             gitpatches.append(gp)
                             gp = None
                             continue
                         if line.startswith('rename from '):
                             gp.op = 'RENAME'
                             gp.oldpath = line[12:]
                         elif line.startswith('rename to '):
                             gp.path = line[10:]
                         elif line.startswith('copy from '):
                             gp.op = 'COPY'
                             gp.oldpath = line[10:]
                         elif line.startswith('copy to '):
                             gp.path = line[8:]
                         elif line.startswith('deleted file'):
                             gp.op = 'DELETE'
                         elif line.startswith('new file mode '):
                             gp.op = 'ADD'
                             gp.setmode(int(line[-6:], 8))
                         elif line.startswith('new mode '):
                             gp.setmode(int(line[-6:], 8))
                         elif line.startswith('GIT binary patch'):
                             gp.binary = True
                 if gp:
                     gitpatches.append(gp)
                 return gitpatches
             class linereader(object):
                 # simple class to allow pushing lines back into the input stream
                 def __init__(self, fp):
                     self.fp = fp
                     self.buf = []
                 def push(self, line):
                     if line is not None:
                         self.buf.append(line)
                 def readline(self):
                     if self.buf:
                         l = self.buf[0]
                         del self.buf[0]
                         return l
                     return self.fp.readline()
                 def __iter__(self):
                     return iter(self.readline, '')
             class abstractbackend(object):
                 def __init__(self, ui):
                     self.ui = ui
                 def getfile(self, fname):
                     """Return target file data and flags as a (data, (islink,
                     isexec)) tuple. Data is None if file is missing/deleted.
                     """
                     raise NotImplementedError
                 def setfile(self, fname, data, mode, copysource):
                     """Write data to target file fname and set its mode. mode is a
                     (islink, isexec) tuple. If data is None, the file content should
                     be left unchanged. If the file is modified after being copied,
                     copysource is set to the original file name.
                     """
                     raise NotImplementedError
                 def unlink(self, fname):
                     """Unlink target file."""
                     raise NotImplementedError
                 def writerej(self, fname, failed, total, lines):
                     """Write rejected lines for fname. total is the number of hunks
                     which failed to apply and total the total number of hunks for this
                     files.
                     """
                 def exists(self, fname):
                     raise NotImplementedError
                 def close(self):
                     raise NotImplementedError
             class fsbackend(abstractbackend):
                 def __init__(self, ui, basedir):
                     super(fsbackend, self).__init__(ui)
                     self.opener = vfsmod.vfs(basedir)
                 def getfile(self, fname):
                     if self.opener.islink(fname):
                         return (self.opener.readlink(fname), (True, False))
                     isexec = False
                     try:
                         isexec = self.opener.lstat(fname).st_mode & 0o100 != 0
                     except OSError as e:
                         if e.errno != errno.ENOENT:
                             raise
                     try:
                         return (self.opener.read(fname), (False, isexec))
                     except IOError as e:
                         if e.errno != errno.ENOENT:
                             raise
                         return None, None
                 def setfile(self, fname, data, mode, copysource):
                     islink, isexec = mode
                     if data is None:
                         self.opener.setflags(fname, islink, isexec)
                         return
                     if islink:
                         self.opener.symlink(data, fname)
                     else:
                         self.opener.write(fname, data)
                         if isexec:
                             self.opener.setflags(fname, False, True)
                 def unlink(self, fname):
                     rmdir = self.ui.configbool('experimental', 'removeemptydirs')
                     self.opener.unlinkpath(fname, ignoremissing=True, rmdir=rmdir)
                 def writerej(self, fname, failed, total, lines):
                     fname = fname + ".rej"
                     self.ui.warn(
                         _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
                         (failed, total, fname))
                     fp = self.opener(fname, 'w')
                     fp.writelines(lines)
                     fp.close()
                 def exists(self, fname):
                     return self.opener.lexists(fname)
             class workingbackend(fsbackend):
                 def __init__(self, ui, repo, similarity):
                     super(workingbackend, self).__init__(ui, repo.root)
                     self.repo = repo
                     self.similarity = similarity
                     self.removed = set()
                     self.changed = set()
                     self.copied = []
                 def _checkknown(self, fname):
                     if self.repo.dirstate[fname] == '?' and self.exists(fname):
                         raise PatchError(_('cannot patch %s: file is not tracked') % fname)
                 def setfile(self, fname, data, mode, copysource):
                     self._checkknown(fname)
                     super(workingbackend, self).setfile(fname, data, mode, copysource)
                     if copysource is not None:
                         self.copied.append((copysource, fname))
                     self.changed.add(fname)
                 def unlink(self, fname):
                     self._checkknown(fname)
                     super(workingbackend, self).unlink(fname)
                     self.removed.add(fname)
                     self.changed.add(fname)
                 def close(self):
                     wctx = self.repo[None]
                     changed = set(self.changed)
                     for src, dst in self.copied:
                         scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst)
                     if self.removed:
                         wctx.forget(sorted(self.removed))
                         for f in self.removed:
                             if f not in self.repo.dirstate:
                                 # File was deleted and no longer belongs to the
                                 # dirstate, it was probably marked added then
                                 # deleted, and should not be considered by
                                 # marktouched().
                                 changed.discard(f)
                     if changed:
                         scmutil.marktouched(self.repo, changed, self.similarity)
                     return sorted(self.changed)
             class filestore(object):
                 def __init__(self, maxsize=None):
                     self.opener = None
                     self.files = {}
                     self.created = 0
                     self.maxsize = maxsize
                     if self.maxsize is None:
                         self.maxsize = 4*(2**20)
                     self.size = 0
                     self.data = {}
                 def setfile(self, fname, data, mode, copied=None):
                     if self.maxsize < 0 or (len(data) + self.size) <= self.maxsize:
                         self.data[fname] = (data, mode, copied)
                         self.size += len(data)
                     else:
                         if self.opener is None:
                             root = pycompat.mkdtemp(prefix='hg-patch-')
                             self.opener = vfsmod.vfs(root)
                         # Avoid filename issues with these simple names
                         fn = '%d' % self.created
                         self.opener.write(fn, data)
                         self.created += 1
                         self.files[fname] = (fn, mode, copied)
                 def getfile(self, fname):
                     if fname in self.data:
                         return self.data[fname]
                     if not self.opener or fname not in self.files:
                         return None, None, None
                     fn, mode, copied = self.files[fname]
                     return self.opener.read(fn), mode, copied
                 def close(self):
                     if self.opener:
                         shutil.rmtree(self.opener.base)
             class repobackend(abstractbackend):
                 def __init__(self, ui, repo, ctx, store):
                     super(repobackend, self).__init__(ui)
                     self.repo = repo
                     self.ctx = ctx
                     self.store = store
                     self.changed = set()
                     self.removed = set()
                     self.copied = {}
                 def _checkknown(self, fname):
                     if fname not in self.ctx:
                         raise PatchError(_('cannot patch %s: file is not tracked') % fname)
                 def getfile(self, fname):
                     try:
                         fctx = self.ctx[fname]
                     except error.LookupError:
                         return None, None
                     flags = fctx.flags()
                     return fctx.data(), ('l' in flags, 'x' in flags)
                 def setfile(self, fname, data, mode, copysource):
                     if copysource:
                         self._checkknown(copysource)
                     if data is None:
                         data = self.ctx[fname].data()
                     self.store.setfile(fname, data, mode, copysource)
                     self.changed.add(fname)
                     if copysource:
                         self.copied[fname] = copysource
                 def unlink(self, fname):
                     self._checkknown(fname)
                     self.removed.add(fname)
                 def exists(self, fname):
                     return fname in self.ctx
                 def close(self):
                     return self.changed | self.removed
             # @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
             unidesc = re.compile(br'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
             contextdesc = re.compile(br'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
             eolmodes = ['strict', 'crlf', 'lf', 'auto']
             class patchfile(object):
                 def __init__(self, ui, gp, backend, store, eolmode='strict'):
                     self.fname = gp.path
                     self.eolmode = eolmode
                     self.eol = None
                     self.backend = backend
                     self.ui = ui
                     self.lines = []
                     self.exists = False
                     self.missing = True
                     self.mode = gp.mode
                     self.copysource = gp.oldpath
                     self.create = gp.op in ('ADD', 'COPY', 'RENAME')
                     self.remove = gp.op == 'DELETE'
                     if self.copysource is None:
                         data, mode = backend.getfile(self.fname)
                     else:
                         data, mode = store.getfile(self.copysource)[:2]
                     if data is not None:
                         self.exists = self.copysource is None or backend.exists(self.fname)
                         self.missing = False
                         if data:
                             self.lines = mdiff.splitnewlines(data)
                         if self.mode is None:
                             self.mode = mode
                         if self.lines:
                             # Normalize line endings
                             if self.lines[0].endswith('\r\n'):
                                 self.eol = '\r\n'
                             elif self.lines[0].endswith('\n'):
                                 self.eol = '\n'
                             if eolmode != 'strict':
                                 nlines = []
                                 for l in self.lines:
                                     if l.endswith('\r\n'):
                                         l = l[:-2] + '\n'
                                     nlines.append(l)
                                 self.lines = nlines
                     else:
                         if self.create:
                             self.missing = False
                         if self.mode is None:
                             self.mode = (False, False)
                     if self.missing:
                         self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)
                         self.ui.warn(_("(use '--prefix' to apply patch relative to the "
                                        "current directory)\n"))
                     self.hash = {}
                     self.dirty = 0
                     self.offset = 0
                     self.skew = 0
                     self.rej = []
                     self.fileprinted = False
                     self.printfile(False)
                     self.hunks = 0
                 def writelines(self, fname, lines, mode):
                     if self.eolmode == 'auto':
                         eol = self.eol
                     elif self.eolmode == 'crlf':
                         eol = '\r\n'
                     else:
                         eol = '\n'
                     if self.eolmode != 'strict' and eol and eol != '\n':
                         rawlines = []
                         for l in lines:
                             if l and l.endswith('\n'):
                                 l = l[:-1] + eol
                             rawlines.append(l)
                         lines = rawlines
                     self.backend.setfile(fname, ''.join(lines), mode, self.copysource)
                 def printfile(self, warn):
                     if self.fileprinted:
                         return
                     if warn or self.ui.verbose:
                         self.fileprinted = True
                     s = _("patching file %s\n") % self.fname
                     if warn:
                         self.ui.warn(s)
                     else:
                         self.ui.note(s)
                 def findlines(self, l, linenum):
                     # looks through the hash and finds candidate lines.  The
                     # result is a list of line numbers sorted based on distance
                     # from linenum
                     cand = self.hash.get(l, [])
                     if len(cand) > 1:
                         # resort our list of potentials forward then back.
                         cand.sort(key=lambda x: abs(x - linenum))
                     return cand
                 def write_rej(self):
                     # our rejects are a little different from patch(1).  This always
                     # creates rejects in the same form as the original patch.  A file
                     # header is inserted so that you can run the reject through patch again
                     # without having to type the filename.
                     if not self.rej:
                         return
                     base = os.path.basename(self.fname)
                     lines = ["--- %s\n+++ %s\n" % (base, base)]
                     for x in self.rej:
                         for l in x.hunk:
                             lines.append(l)
                             if l[-1:] != '\n':
                                 lines.append("\n\\ No newline at end of file\n")
                     self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)
                 def apply(self, h):
                     if not h.complete():
                         raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                                         (h.number, h.desc, len(h.a), h.lena, len(h.b),
                                         h.lenb))
                     self.hunks += 1
                     if self.missing:
                         self.rej.append(h)
                         return -1
                     if self.exists and self.create:
                         if self.copysource:
                             self.ui.warn(_("cannot create %s: destination already "
                                            "exists\n") % self.fname)
                         else:
                             self.ui.warn(_("file %s already exists\n") % self.fname)
                         self.rej.append(h)
                         return -1
                     if isinstance(h, binhunk):
                         if self.remove:
                             self.backend.unlink(self.fname)
                         else:
                             l = h.new(self.lines)
                             self.lines[:] = l
                             self.offset += len(l)
                             self.dirty = True
                         return 0
                     horig = h
                     if (self.eolmode in ('crlf', 'lf')
                         or self.eolmode == 'auto' and self.eol):
                         # If new eols are going to be normalized, then normalize
                         # hunk data before patching. Otherwise, preserve input
                         # line-endings.
                         h = h.getnormalized()
                     # fast case first, no offsets, no fuzz
                     old, oldstart, new, newstart = h.fuzzit(0, False)
                     oldstart += self.offset
                     orig_start = oldstart
                     # if there's skew we want to emit the "(offset %d lines)" even
                     # when the hunk cleanly applies at start + skew, so skip the
                     # fast case code
                     if self.skew == 0 and diffhelper.testhunk(old, self.lines, oldstart):
                         if self.remove:
                             self.backend.unlink(self.fname)
                         else:
                             self.lines[oldstart:oldstart + len(old)] = new
                             self.offset += len(new) - len(old)
                             self.dirty = True
                         return 0
                     # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
                     self.hash = {}
                     for x, s in enumerate(self.lines):
                         self.hash.setdefault(s, []).append(x)
                     for fuzzlen in pycompat.xrange(self.ui.configint("patch", "fuzz") + 1):
                         for toponly in [True, False]:
                             old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
                             oldstart = oldstart + self.offset + self.skew
                             oldstart = min(oldstart, len(self.lines))
                             if old:
                                 cand = self.findlines(old[0][1:], oldstart)
                             else:
                                 # Only adding lines with no or fuzzed context, just
                                 # take the skew in account
                                 cand = [oldstart]
                             for l in cand:
                                 if not old or diffhelper.testhunk(old, self.lines, l):
                                     self.lines[l : l + len(old)] = new
                                     self.offset += len(new) - len(old)
                                     self.skew = l - orig_start
                                     self.dirty = True
                                     offset = l - orig_start - fuzzlen
                                     if fuzzlen:
                                         msg = _("Hunk #%d succeeded at %d "
                                                 "with fuzz %d "
                                                 "(offset %d lines).\n")
                                         self.printfile(True)
                                         self.ui.warn(msg %
                                             (h.number, l + 1, fuzzlen, offset))
                                     else:
                                         msg = _("Hunk #%d succeeded at %d "
                                                 "(offset %d lines).\n")
                                         self.ui.note(msg % (h.number, l + 1, offset))
                                     return fuzzlen
                     self.printfile(True)
                     self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
                     self.rej.append(horig)
                     return -1
                 def close(self):
                     if self.dirty:
                         self.writelines(self.fname, self.lines, self.mode)
                     self.write_rej()
                     return len(self.rej)
             class header(object):
                 """patch header
                 """
                 diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
                 diff_re = re.compile('diff -r .* (.*)$')
                 allhunks_re = re.compile('(?:index|deleted file) ')
                 pretty_re = re.compile('(?:new file|deleted file) ')
                 special_re = re.compile('(?:index|deleted|copy|rename|new mode) ')
                 newfile_re = re.compile('(?:new file)')
                 def __init__(self, header):
                     self.header = header
                     self.hunks = []
                 def binary(self):
                     return any(h.startswith('index ') for h in self.header)
                 def pretty(self, fp):
                     for h in self.header:
                         if h.startswith('index '):
                             fp.write(_('this modifies a binary file (all or nothing)\n'))
                             break
                         if self.pretty_re.match(h):
                             fp.write(h)
                             if self.binary():
                                 fp.write(_('this is a binary file\n'))
                             break
                         if h.startswith('---'):
                             fp.write(_('%d hunks, %d lines changed\n') %
                                      (len(self.hunks),
                                       sum([max(h.added, h.removed) for h in self.hunks])))
                             break
                         fp.write(h)
                 def write(self, fp):
                     fp.write(''.join(self.header))
                 def allhunks(self):
                     return any(self.allhunks_re.match(h) for h in self.header)
                 def files(self):
                     match = self.diffgit_re.match(self.header[0])
                     if match:
                         fromfile, tofile = match.groups()
                         if fromfile == tofile:
                             return [fromfile]
                         return [fromfile, tofile]
                     else:
                         return self.diff_re.match(self.header[0]).groups()
                 def filename(self):
                     return self.files()[-1]
                 def __repr__(self):
                     return '<header %s>' % (' '.join(map(repr, self.files())))
                 def isnewfile(self):
                     return any(self.newfile_re.match(h) for h in self.header)
                 def special(self):
                     # Special files are shown only at the header level and not at the hunk
                     # level for example a file that has been deleted is a special file.
                     # The user cannot change the content of the operation, in the case of
                     # the deleted file he has to take the deletion or not take it, he
                     # cannot take some of it.
                     # Newly added files are special if they are empty, they are not special
                     # if they have some content as we want to be able to change it
                     nocontent = len(self.header) == 2
                     emptynewfile = self.isnewfile() and nocontent
                     return (emptynewfile
                             or any(self.special_re.match(h) for h in self.header))
             class recordhunk(object):
                 """patch hunk
                 XXX shouldn't we merge this with the other hunk class?
                 """
                 def __init__(self, header, fromline, toline, proc, before, hunk, after,
                              maxcontext=None):
                     def trimcontext(lines, reverse=False):
                         if maxcontext is not None:
                             delta = len(lines) - maxcontext
                             if delta > 0:
                                 if reverse:
                                     return delta, lines[delta:]
                                 else:
                                     return delta, lines[:maxcontext]
                         return 0, lines
                     self.header = header
                     trimedbefore, self.before = trimcontext(before, True)
                     self.fromline = fromline + trimedbefore
                     self.toline = toline + trimedbefore
                     _trimedafter, self.after = trimcontext(after, False)
                     self.proc = proc
                     self.hunk = hunk
                     self.added, self.removed = self.countchanges(self.hunk)
                 def __eq__(self, v):
                     if not isinstance(v, recordhunk):
                         return False
                     return ((v.hunk == self.hunk) and
                             (v.proc == self.proc) and
                             (self.fromline == v.fromline) and
                             (self.header.files() == v.header.files()))
                 def __hash__(self):
                     return hash((tuple(self.hunk),
                         tuple(self.header.files()),
                         self.fromline,
                         self.proc))
                 def countchanges(self, hunk):
                     """hunk -> (n+,n-)"""
                     add = len([h for h in hunk if h.startswith('+')])
                     rem = len([h for h in hunk if h.startswith('-')])
                     return add, rem
                 def reversehunk(self):
                     """return another recordhunk which is the reverse of the hunk
                     If this hunk is diff(A, B), the returned hunk is diff(B, A). To do
                     that, swap fromline/toline and +/- signs while keep other things
                     unchanged.
                     """
                     m = {'+': '-', '-': '+', '\\': '\\'}
                     hunk = ['%s%s' % (m[l[0:1]], l[1:]) for l in self.hunk]
                     return recordhunk(self.header, self.toline, self.fromline, self.proc,
                                       self.before, hunk, self.after)
                 def write(self, fp):
                     delta = len(self.before) + len(self.after)
                     if self.after and self.after[-1] == '\\ No newline at end of file\n':
                         delta -= 1
                     fromlen = delta + self.removed
                     tolen = delta + self.added
                     fp.write('@@ -%d,%d +%d,%d @@%s\n' %
                              (self.fromline, fromlen, self.toline, tolen,
                               self.proc and (' ' + self.proc)))
                     fp.write(''.join(self.before + self.hunk + self.after))
                 pretty = write
                 def filename(self):
                     return self.header.filename()
                 def __repr__(self):
                     return '<hunk %r@%d>' % (self.filename(), self.fromline)
             def getmessages():
                 return {
                     'multiple': {
                         'apply': _("apply change %d/%d to '%s'?"),
                         'discard': _("discard change %d/%d to '%s'?"),
                         'record': _("record change %d/%d to '%s'?"),
                     },
                     'single': {
                         'apply': _("apply this change to '%s'?"),
                         'discard': _("discard this change to '%s'?"),
                         'record': _("record this change to '%s'?"),
                     },
                     'help': {
                         'apply': _('[Ynesfdaq?]'
                                      '$$ &Yes, apply this change'
                                      '$$ &No, skip this change'
                                      '$$ &Edit this change manually'
                                      '$$ &Skip remaining changes to this file'
                                      '$$ Apply remaining changes to this &file'
                                      '$$ &Done, skip remaining changes and files'
                                      '$$ Apply &all changes to all remaining files'
                                      '$$ &Quit, applying no changes'
                                      '$$ &? (display help)'),
                         'discard': _('[Ynesfdaq?]'
                                      '$$ &Yes, discard this change'
                                      '$$ &No, skip this change'
                                      '$$ &Edit this change manually'
                                      '$$ &Skip remaining changes to this file'
                                      '$$ Discard remaining changes to this &file'
                                      '$$ &Done, skip remaining changes and files'
                                      '$$ Discard &all changes to all remaining files'
                                      '$$ &Quit, discarding no changes'
                                      '$$ &? (display help)'),
                         'record': _('[Ynesfdaq?]'
                                     '$$ &Yes, record this change'
                                     '$$ &No, skip this change'
                                     '$$ &Edit this change manually'
                                     '$$ &Skip remaining changes to this file'
                                     '$$ Record remaining changes to this &file'
                                     '$$ &Done, skip remaining changes and files'
                                     '$$ Record &all changes to all remaining files'
                                     '$$ &Quit, recording no changes'
                                     '$$ &? (display help)'),
                     }
                 }
             def filterpatch(ui, headers, operation=None):
                 """Interactively filter patch chunks into applied-only chunks"""
                 messages = getmessages()
                 if operation is None:
                     operation = 'record'
                 def prompt(skipfile, skipall, query, chunk):
                     """prompt query, and process base inputs
                     - y/n for the rest of file
                     - y/n for the rest
                     - ? (help)
                     - q (quit)
                     Return True/False and possibly updated skipfile and skipall.
                     """
                     newpatches = None
                     if skipall is not None:
                         return skipall, skipfile, skipall, newpatches
                     if skipfile is not None:
                         return skipfile, skipfile, skipall, newpatches
                     while True:
                         resps = messages['help'][operation]
                         r = ui.promptchoice("%s %s" % (query, resps))
                         ui.write("\n")
                         if r == 8: # ?
                             for c, t in ui.extractchoices(resps)[1]:
                                 ui.write('%s - %s\n' % (c, encoding.lower(t)))
                             continue
                         elif r == 0: # yes
                             ret = True
                         elif r == 1: # no
                             ret = False
                         elif r == 2: # Edit patch
                             if chunk is None:
                                 ui.write(_('cannot edit patch for whole file'))
                                 ui.write("\n")
                                 continue
                             if chunk.header.binary():
                                 ui.write(_('cannot edit patch for binary file'))
                                 ui.write("\n")
                                 continue
                             # Patch comment based on the Git one (based on comment at end of
                             # https://mercurial-scm.org/wiki/RecordExtension)
                             phelp = '---' + _("""
             To remove '-' lines, make them ' ' lines (context).
             To remove '+' lines, delete them.
             Lines starting with # will be removed from the patch.
             If the patch applies cleanly, the edited hunk will immediately be
             added to the record list. If it does not apply cleanly, a rejects
             file will be generated: you can use that when you try again. If
             all lines of the hunk are removed, then the edit is aborted and
             the hunk is left unchanged.
             """)
                             (patchfd, patchfn) = pycompat.mkstemp(prefix="hg-editor-",
                                                                   suffix=".diff")
                             ncpatchfp = None
                             try:
                                 # Write the initial patch
                                 f = util.nativeeolwriter(os.fdopen(patchfd, r'wb'))
                                 chunk.header.write(f)
                                 chunk.write(f)
-                                f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
+                                f.write(''.join(['# ' + i + '\n'
+                                                 for i in phelp.splitlines()]))
                                 f.close()
                                 # Start the editor and wait for it to complete
                                 editor = ui.geteditor()
                                 ret = ui.system("%s \"%s\"" % (editor, patchfn),
                                                 environ={'HGUSER': ui.username()},
                                                 blockedtag='filterpatch')
                                 if ret != 0:
                                     ui.warn(_("editor exited with exit code %d\n") % ret)
                                     continue
                                 # Remove comment lines
                                 patchfp = open(patchfn, r'rb')
                                 ncpatchfp = stringio()
                                 for line in util.iterfile(patchfp):
                                     line = util.fromnativeeol(line)
                                     if not line.startswith('#'):
                                         ncpatchfp.write(line)
                                 patchfp.close()
                                 ncpatchfp.seek(0)
                                 newpatches = parsepatch(ncpatchfp)
                             finally:
                                 os.unlink(patchfn)
                                 del ncpatchfp
                             # Signal that the chunk shouldn't be applied as-is, but
                             # provide the new patch to be used instead.
                             ret = False
                         elif r == 3: # Skip
                             ret = skipfile = False
                         elif r == 4: # file (Record remaining)
                             ret = skipfile = True
                         elif r == 5: # done, skip remaining
                             ret = skipall = False
                         elif r == 6: # all
                             ret = skipall = True
                         elif r == 7: # quit
                             raise error.Abort(_('user quit'))
                         return ret, skipfile, skipall, newpatches
                 seen = set()
                 applied = {}        # 'filename' -> [] of chunks
                 skipfile, skipall = None, None
                 pos, total = 1, sum(len(h.hunks) for h in headers)
                 for h in headers:
                     pos += len(h.hunks)
                     skipfile = None
                     fixoffset = 0
                     hdr = ''.join(h.header)
                     if hdr in seen:
                         continue
                     seen.add(hdr)
                     if skipall is None:
                         h.pretty(ui)
                     msg = (_('examine changes to %s?') %
                            _(' and ').join("'%s'" % f for f in h.files()))
                     r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
                     if not r:
                         continue
                     applied[h.filename()] = [h]
                     if h.allhunks():
                         applied[h.filename()] += h.hunks
                         continue
                     for i, chunk in enumerate(h.hunks):
                         if skipfile is None and skipall is None:
                             chunk.pretty(ui)
                         if total == 1:
                             msg = messages['single'][operation] % chunk.filename()
                         else:
                             idx = pos - len(h.hunks) + i
                             msg = messages['multiple'][operation] % (idx, total,
                                                                      chunk.filename())
                         r, skipfile, skipall, newpatches = prompt(skipfile,
                                 skipall, msg, chunk)
                         if r:
                             if fixoffset:
                                 chunk = copy.copy(chunk)
                                 chunk.toline += fixoffset
                             applied[chunk.filename()].append(chunk)
                         elif newpatches is not None:
                             for newpatch in newpatches:
                                 for newhunk in newpatch.hunks:
                                     if fixoffset:
                                         newhunk.toline += fixoffset
                                     applied[newhunk.filename()].append(newhunk)
                         else:
                             fixoffset += chunk.removed - chunk.added
                 return (sum([h for h in applied.itervalues()
                            if h[0].special() or len(h) > 1], []), {})
             class hunk(object):
                 def __init__(self, desc, num, lr, context):
                     self.number = num
                     self.desc = desc
                     self.hunk = [desc]
                     self.a = []
                     self.b = []
                     self.starta = self.lena = None
                     self.startb = self.lenb = None
                     if lr is not None:
                         if context:
                             self.read_context_hunk(lr)
                         else:
                             self.read_unified_hunk(lr)
                 def getnormalized(self):
                     """Return a copy with line endings normalized to LF."""
                     def normalize(lines):
                         nlines = []
                         for line in lines:
                             if line.endswith('\r\n'):
                                 line = line[:-2] + '\n'
                             nlines.append(line)
                         return nlines
                     # Dummy object, it is rebuilt manually
                     nh = hunk(self.desc, self.number, None, None)
                     nh.number = self.number
                     nh.desc = self.desc
                     nh.hunk = self.hunk
                     nh.a = normalize(self.a)
                     nh.b = normalize(self.b)
                     nh.starta = self.starta
                     nh.startb = self.startb
                     nh.lena = self.lena
                     nh.lenb = self.lenb
                     return nh
                 def read_unified_hunk(self, lr):
                     m = unidesc.match(self.desc)
                     if not m:
                         raise PatchError(_("bad hunk #%d") % self.number)
                     self.starta, self.lena, self.startb, self.lenb = m.groups()
                     if self.lena is None:
                         self.lena = 1
                     else:
                         self.lena = int(self.lena)
                     if self.lenb is None:
                         self.lenb = 1
                     else:
                         self.lenb = int(self.lenb)
                     self.starta = int(self.starta)
                     self.startb = int(self.startb)
                     try:
                         diffhelper.addlines(lr, self.hunk, self.lena, self.lenb,
                                             self.a, self.b)
                     except error.ParseError as e:
                         raise PatchError(_("bad hunk #%d: %s") % (self.number, e))
                     # if we hit eof before finishing out the hunk, the last line will
                     # be zero length.  Lets try to fix it up.
                     while len(self.hunk[-1]) == 0:
                         del self.hunk[-1]
                         del self.a[-1]
                         del self.b[-1]
                         self.lena -= 1
                         self.lenb -= 1
                     self._fixnewline(lr)
                 def read_context_hunk(self, lr):
                     self.desc = lr.readline()
                     m = contextdesc.match(self.desc)
                     if not m:
                         raise PatchError(_("bad hunk #%d") % self.number)
                     self.starta, aend = m.groups()
                     self.starta = int(self.starta)
                     if aend is None:
                         aend = self.starta
                     self.lena = int(aend) - self.starta
                     if self.starta:
                         self.lena += 1
                     for x in pycompat.xrange(self.lena):
                         l = lr.readline()
                         if l.startswith('---'):
                             # lines addition, old block is empty
                             lr.push(l)
                             break
                         s = l[2:]
                         if l.startswith('- ') or l.startswith('! '):
                             u = '-' + s
                         elif l.startswith('  '):
                             u = ' ' + s
                         else:
                             raise PatchError(_("bad hunk #%d old text line %d") %
                                              (self.number, x))
                         self.a.append(u)
                         self.hunk.append(u)
                     l = lr.readline()
                     if l.startswith(br'\ '):
                         s = self.a[-1][:-1]
                         self.a[-1] = s
                         self.hunk[-1] = s
                         l = lr.readline()
                     m = contextdesc.match(l)
                     if not m:
                         raise PatchError(_("bad hunk #%d") % self.number)
                     self.startb, bend = m.groups()
                     self.startb = int(self.startb)
                     if bend is None:
                         bend = self.startb
                     self.lenb = int(bend) - self.startb
                     if self.startb:
                         self.lenb += 1
                     hunki = 1
                     for x in pycompat.xrange(self.lenb):
                         l = lr.readline()
                         if l.startswith(br'\ '):
                             # XXX: the only way to hit this is with an invalid line range.
                             # The no-eol marker is not counted in the line range, but I
                             # guess there are diff(1) out there which behave differently.
                             s = self.b[-1][:-1]
                             self.b[-1] = s
                             self.hunk[hunki - 1] = s
                             continue
                         if not l:
                             # line deletions, new block is empty and we hit EOF
                             lr.push(l)
                             break
                         s = l[2:]
                         if l.startswith('+ ') or l.startswith('! '):
                             u = '+' + s
                         elif l.startswith('  '):
                             u = ' ' + s
                         elif len(self.b) == 0:
                             # line deletions, new block is empty
                             lr.push(l)
                             break
                         else:
                             raise PatchError(_("bad hunk #%d old text line %d") %
                                              (self.number, x))
                         self.b.append(s)
                         while True:
                             if hunki >= len(self.hunk):
                                 h = ""
                             else:
                                 h = self.hunk[hunki]
                             hunki += 1
                             if h == u:
                                 break
                             elif h.startswith('-'):
                                 continue
                             else:
                                 self.hunk.insert(hunki - 1, u)
                                 break
                     if not self.a:
                         # this happens when lines were only added to the hunk
                         for x in self.hunk:
                             if x.startswith('-') or x.startswith(' '):
                                 self.a.append(x)
                     if not self.b:
                         # this happens when lines were only deleted from the hunk
                         for x in self.hunk:
                             if x.startswith('+') or x.startswith(' '):
                                 self.b.append(x[1:])
                     # @@ -start,len +start,len @@
                     self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                                          self.startb, self.lenb)
                     self.hunk[0] = self.desc
                     self._fixnewline(lr)
                 def _fixnewline(self, lr):
                     l = lr.readline()
                     if l.startswith(br'\ '):
                         diffhelper.fixnewline(self.hunk, self.a, self.b)
                     else:
                         lr.push(l)
                 def complete(self):
                     return len(self.a) == self.lena and len(self.b) == self.lenb
                 def _fuzzit(self, old, new, fuzz, toponly):
                     # this removes context lines from the top and bottom of list 'l'.  It
                     # checks the hunk to make sure only context lines are removed, and then
                     # returns a new shortened list of lines.
                     fuzz = min(fuzz, len(old))
                     if fuzz:
                         top = 0
                         bot = 0
                         hlen = len(self.hunk)
                         for x in pycompat.xrange(hlen - 1):
                             # the hunk starts with the @@ line, so use x+1
                             if self.hunk[x + 1].startswith(' '):
                                 top += 1
                             else:
                                 break
                         if not toponly:
                             for x in pycompat.xrange(hlen - 1):
                                 if self.hunk[hlen - bot - 1].startswith(' '):
                                     bot += 1
                                 else:
                                     break
                         bot = min(fuzz, bot)
                         top = min(fuzz, top)
                         return old[top:len(old) - bot], new[top:len(new) - bot], top
                     return old, new, 0
                 def fuzzit(self, fuzz, toponly):
                     old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
                     oldstart = self.starta + top
                     newstart = self.startb + top
                     # zero length hunk ranges already have their start decremented
                     if self.lena and oldstart > 0:
                         oldstart -= 1
                     if self.lenb and newstart > 0:
                         newstart -= 1
                     return old, oldstart, new, newstart
             class binhunk(object):
                 'A binary patch file.'
                 def __init__(self, lr, fname):
                     self.text = None
                     self.delta = False
                     self.hunk = ['GIT binary patch\n']
                     self._fname = fname
                     self._read(lr)
                 def complete(self):
                     return self.text is not None
                 def new(self, lines):
                     if self.delta:
                         return [applybindelta(self.text, ''.join(lines))]
                     return [self.text]
                 def _read(self, lr):
                     def getline(lr, hunk):
                         l = lr.readline()
                         hunk.append(l)
                         return l.rstrip('\r\n')
                     while True:
                         line = getline(lr, self.hunk)
                         if not line:
                             raise PatchError(_('could not extract "%s" binary data')
                                              % self._fname)
                         if line.startswith('literal '):
                             size = int(line[8:].rstrip())
                             break
                         if line.startswith('delta '):
                             size = int(line[6:].rstrip())
                             self.delta = True
                             break
                     dec = []
                     line = getline(lr, self.hunk)
                     while len(line) > 1:
                         l = line[0:1]
                         if l <= 'Z' and l >= 'A':
                             l = ord(l) - ord('A') + 1
                         else:
                             l = ord(l) - ord('a') + 27
                         try:
                             dec.append(util.b85decode(line[1:])[:l])
                         except ValueError as e:
                             raise PatchError(_('could not decode "%s" binary patch: %s')
                                              % (self._fname, stringutil.forcebytestr(e)))
                         line = getline(lr, self.hunk)
                     text = zlib.decompress(''.join(dec))
                     if len(text) != size:
                         raise PatchError(_('"%s" length is %d bytes, should be %d')
                                          % (self._fname, len(text), size))
                     self.text = text
             def parsefilename(str):
                 # --- filename \t|space stuff
                 s = str[4:].rstrip('\r\n')
                 i = s.find('\t')
                 if i < 0:
                     i = s.find(' ')
                     if i < 0:
                         return s
                 return s[:i]
             def reversehunks(hunks):
                 '''reverse the signs in the hunks given as argument
                 This function operates on hunks coming out of patch.filterpatch, that is
                 a list of the form: [header1, hunk1, hunk2, header2...]. Example usage:
                 >>> rawpatch = b"""diff --git a/folder1/g b/folder1/g
                 ... --- a/folder1/g
                 ... +++ b/folder1/g
                 ... @@ -1,7 +1,7 @@
                 ... +firstline
                 ...  c
                 ...  1
                 ...  2
                 ... + 3
                 ... -4
                 ...  5
                 ...  d
                 ... +lastline"""
                 >>> hunks = parsepatch([rawpatch])
                 >>> hunkscomingfromfilterpatch = []
                 >>> for h in hunks:
                 ...     hunkscomingfromfilterpatch.append(h)
                 ...     hunkscomingfromfilterpatch.extend(h.hunks)
                 >>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)
                 >>> from . import util
                 >>> fp = util.stringio()
                 >>> for c in reversedhunks:
                 ...      c.write(fp)
                 >>> fp.seek(0) or None
                 >>> reversedpatch = fp.read()
                 >>> print(pycompat.sysstr(reversedpatch))
                 diff --git a/folder1/g b/folder1/g
                 --- a/folder1/g
                 +++ b/folder1/g
                 @@ -1,4 +1,3 @@
                 -firstline
                  c
                 @@ -2,6 +1,6 @@
                  c
                 - 3
                 +4
                  d
                 @@ -6,3 +5,2 @@
                  d
                 -lastline
                 '''
                 newhunks = []
                 for c in hunks:
                     if util.safehasattr(c, 'reversehunk'):
                         c = c.reversehunk()
                     newhunks.append(c)
                 return newhunks
             def parsepatch(originalchunks, maxcontext=None):
                 """patch -> [] of headers -> [] of hunks
                 If maxcontext is not None, trim context lines if necessary.
                 >>> rawpatch = b'''diff --git a/folder1/g b/folder1/g
                 ... --- a/folder1/g
                 ... +++ b/folder1/g
                 ... @@ -1,8 +1,10 @@
                 ...  1
                 ...  2
                 ... -3
                 ...  4
                 ...  5
                 ...  6
                 ... +6.1
                 ... +6.2
                 ...  7
                 ...  8
                 ... +9'''
                 >>> out = util.stringio()
                 >>> headers = parsepatch([rawpatch], maxcontext=1)
                 >>> for header in headers:
                 ...     header.write(out)
                 ...     for hunk in header.hunks:
                 ...         hunk.write(out)
                 >>> print(pycompat.sysstr(out.getvalue()))
                 diff --git a/folder1/g b/folder1/g
                 --- a/folder1/g
                 +++ b/folder1/g
                 @@ -2,3 +2,2 @@
                 -3
                 @@ -6,2 +5,4 @@
                 +6.1
                 +6.2
                 @@ -8,1 +9,2 @@
                 +9
                 """
                 class parser(object):
                     """patch parsing state machine"""
                     def __init__(self):
                         self.fromline = 0
                         self.toline = 0
                         self.proc = ''
                         self.header = None
                         self.context = []
                         self.before = []
                         self.hunk = []
                         self.headers = []
                     def addrange(self, limits):
                         self.addcontext([])
                         fromstart, fromend, tostart, toend, proc = limits
                         self.fromline = int(fromstart)
                         self.toline = int(tostart)
                         self.proc = proc
                     def addcontext(self, context):
                         if self.hunk:
                             h = recordhunk(self.header, self.fromline, self.toline,
                                     self.proc, self.before, self.hunk, context, maxcontext)
                             self.header.hunks.append(h)
                             self.fromline += len(self.before) + h.removed
                             self.toline += len(self.before) + h.added
                             self.before = []
                             self.hunk = []
                         self.context = context
                     def addhunk(self, hunk):
                         if self.context:
                             self.before = self.context
                             self.context = []
                         if self.hunk:
                             self.addcontext([])
                         self.hunk = hunk
                     def newfile(self, hdr):
                         self.addcontext([])
                         h = header(hdr)
                         self.headers.append(h)
                         self.header = h
                     def addother(self, line):
                         pass # 'other' lines are ignored
                     def finished(self):
                         self.addcontext([])
                         return self.headers
                     transitions = {
                         'file': {'context': addcontext,
                                  'file': newfile,
                                  'hunk': addhunk,
                                  'range': addrange},
                         'context': {'file': newfile,
                                     'hunk': addhunk,
                                     'range': addrange,
                                     'other': addother},
                         'hunk': {'context': addcontext,
                                  'file': newfile,
                                  'range': addrange},
                         'range': {'context': addcontext,
                                   'hunk': addhunk},
                         'other': {'other': addother},
                         }
                 p = parser()
                 fp = stringio()
                 fp.write(''.join(originalchunks))
                 fp.seek(0)
                 state = 'context'
                 for newstate, data in scanpatch(fp):
                     try:
                         p.transitions[state][newstate](p, data)
                     except KeyError:
                         raise PatchError('unhandled transition: %s -> %s' %
                                                (state, newstate))
                     state = newstate
                 del fp
                 return p.finished()
             def pathtransform(path, strip, prefix):
                 '''turn a path from a patch into a path suitable for the repository
                 prefix, if not empty, is expected to be normalized with a / at the end.
                 Returns (stripped components, path in repository).
                 >>> pathtransform(b'a/b/c', 0, b'')
                 ('', 'a/b/c')
                 >>> pathtransform(b'   a/b/c   ', 0, b'')
                 ('', '   a/b/c')
                 >>> pathtransform(b'   a/b/c   ', 2, b'')
                 ('a/b/', 'c')
                 >>> pathtransform(b'a/b/c', 0, b'd/e/')
                 ('', 'd/e/a/b/c')
                 >>> pathtransform(b'   a//b/c   ', 2, b'd/e/')
                 ('a//b/', 'd/e/c')
                 >>> pathtransform(b'a/b/c', 3, b'')
                 Traceback (most recent call last):
                 PatchError: unable to strip away 1 of 3 dirs from a/b/c
                 '''
                 pathlen = len(path)
                 i = 0
                 if strip == 0:
                     return '', prefix + path.rstrip()
                 count = strip
                 while count > 0:
                     i = path.find('/', i)
                     if i == -1:
                         raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                                          (count, strip, path))
                     i += 1
                     # consume '//' in the path
                     while i < pathlen - 1 and path[i:i + 1] == '/':
                         i += 1
                     count -= 1
                 return path[:i].lstrip(), prefix + path[i:].rstrip()
             def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
                 nulla = afile_orig == "/dev/null"
                 nullb = bfile_orig == "/dev/null"
                 create = nulla and hunk.starta == 0 and hunk.lena == 0
                 remove = nullb and hunk.startb == 0 and hunk.lenb == 0
                 abase, afile = pathtransform(afile_orig, strip, prefix)
                 gooda = not nulla and backend.exists(afile)
                 bbase, bfile = pathtransform(bfile_orig, strip, prefix)
                 if afile == bfile:
                     goodb = gooda
                 else:
                     goodb = not nullb and backend.exists(bfile)
                 missing = not goodb and not gooda and not create
                 # some diff programs apparently produce patches where the afile is
                 # not /dev/null, but afile starts with bfile
                 abasedir = afile[:afile.rfind('/') + 1]
                 bbasedir = bfile[:bfile.rfind('/') + 1]
                 if (missing and abasedir == bbasedir and afile.startswith(bfile)
                     and hunk.starta == 0 and hunk.lena == 0):
                     create = True
                     missing = False
                 # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
                 # diff is between a file and its backup. In this case, the original
                 # file should be patched (see original mpatch code).
                 isbackup = (abase == bbase and bfile.startswith(afile))
                 fname = None
                 if not missing:
                     if gooda and goodb:
                         if isbackup:
                             fname = afile
                         else:
                             fname = bfile
                     elif gooda:
                         fname = afile
                 if not fname:
                     if not nullb:
                         if isbackup:
                             fname = afile
                         else:
                             fname = bfile
                     elif not nulla:
                         fname = afile
                     else:
                         raise PatchError(_("undefined source and destination files"))
                 gp = patchmeta(fname)
                 if create:
                     gp.op = 'ADD'
                 elif remove:
                     gp.op = 'DELETE'
                 return gp
             def scanpatch(fp):
                 """like patch.iterhunks, but yield different events
                 - ('file',    [header_lines + fromfile + tofile])
                 - ('context', [context_lines])
                 - ('hunk',    [hunk_lines])
                 - ('range',   (-start,len, +start,len, proc))
                 """
                 lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')
                 lr = linereader(fp)
                 def scanwhile(first, p):
                     """scan lr while predicate holds"""
                     lines = [first]
                     for line in iter(lr.readline, ''):
                         if p(line):
                             lines.append(line)
                         else:
                             lr.push(line)
                             break
                     return lines
                 for line in iter(lr.readline, ''):
                     if line.startswith('diff --git a/') or line.startswith('diff -r '):
                         def notheader(line):
                             s = line.split(None, 1)
                             return not s or s[0] not in ('---', 'diff')
                         header = scanwhile(line, notheader)
                         fromfile = lr.readline()
                         if fromfile.startswith('---'):
                             tofile = lr.readline()
                             header += [fromfile, tofile]
                         else:
                             lr.push(fromfile)
                         yield 'file', header
                     elif line.startswith(' '):
                         cs = (' ', '\\')
                         yield 'context', scanwhile(line, lambda l: l.startswith(cs))
                     elif line.startswith(('-', '+')):
                         cs = ('-', '+', '\\')
                         yield 'hunk', scanwhile(line, lambda l: l.startswith(cs))
                     else:
                         m = lines_re.match(line)
                         if m:
                             yield 'range', m.groups()
                         else:
                             yield 'other', line
             def scangitpatch(lr, firstline):
                 """
                 Git patches can emit:
                 - rename a to b
                 - change b
                 - copy a to c
                 - change c
                 We cannot apply this sequence as-is, the renamed 'a' could not be
                 found for it would have been renamed already. And we cannot copy
                 from 'b' instead because 'b' would have been changed already. So
                 we scan the git patch for copy and rename commands so we can
                 perform the copies ahead of time.
                 """
                 pos = 0
                 try:
                     pos = lr.fp.tell()
                     fp = lr.fp
                 except IOError:
                     fp = stringio(lr.fp.read())
                 gitlr = linereader(fp)
                 gitlr.push(firstline)
                 gitpatches = readgitpatch(gitlr)
                 fp.seek(pos)
                 return gitpatches
             def iterhunks(fp):
                 """Read a patch and yield the following events:
                 - ("file", afile, bfile, firsthunk): select a new target file.
                 - ("hunk", hunk): a new hunk is ready to be applied, follows a
                 "file" event.
                 - ("git", gitchanges): current diff is in git format, gitchanges
                 maps filenames to gitpatch records. Unique event.
                 """
                 afile = ""
                 bfile = ""
                 state = None
                 hunknum = 0
                 emitfile = newfile = False
                 gitpatches = None
                 # our states
                 BFILE = 1
                 context = None
                 lr = linereader(fp)
                 for x in iter(lr.readline, ''):
                     if state == BFILE and (
                         (not context and x.startswith('@'))
                         or (context is not False and x.startswith('***************'))
                         or x.startswith('GIT binary patch')):
                         gp = None
                         if (gitpatches and
                             gitpatches[-1].ispatching(afile, bfile)):
                             gp = gitpatches.pop()
                         if x.startswith('GIT binary patch'):
                             h = binhunk(lr, gp.path)
                         else:
                             if context is None and x.startswith('***************'):
                                 context = True
                             h = hunk(x, hunknum + 1, lr, context)
                         hunknum += 1
                         if emitfile:
                             emitfile = False
                             yield 'file', (afile, bfile, h, gp and gp.copy() or None)
                         yield 'hunk', h
                     elif x.startswith('diff --git a/'):
                         m = gitre.match(x.rstrip(' \r\n'))
                         if not m:
                             continue
                         if gitpatches is None:
                             # scan whole input for git metadata
                             gitpatches = scangitpatch(lr, x)
                             yield 'git', [g.copy() for g in gitpatches
                                           if g.op in ('COPY', 'RENAME')]
                             gitpatches.reverse()
                         afile = 'a/' + m.group(1)
                         bfile = 'b/' + m.group(2)
                         while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                             gp = gitpatches.pop()
                             yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
                         if not gitpatches:
                             raise PatchError(_('failed to synchronize metadata for "%s"')
                                              % afile[2:])
                         newfile = True
                     elif x.startswith('---'):
                         # check for a unified diff
                         l2 = lr.readline()
                         if not l2.startswith('+++'):
                             lr.push(l2)
                             continue
                         newfile = True
                         context = False
                         afile = parsefilename(x)
                         bfile = parsefilename(l2)
                     elif x.startswith('***'):
                         # check for a context diff
                         l2 = lr.readline()
                         if not l2.startswith('---'):
                             lr.push(l2)
                             continue
                         l3 = lr.readline()
                         lr.push(l3)
                         if not l3.startswith("***************"):
                             lr.push(l2)
                             continue
                         newfile = True
                         context = True
                         afile = parsefilename(x)
                         bfile = parsefilename(l2)
                     if newfile:
                         newfile = False
                         emitfile = True
                         state = BFILE
                         hunknum = 0
                 while gitpatches:
                     gp = gitpatches.pop()
                     yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
             def applybindelta(binchunk, data):
                 """Apply a binary delta hunk
                 The algorithm used is the algorithm from git's patch-delta.c
                 """
                 def deltahead(binchunk):
                     i = 0
                     for c in pycompat.bytestr(binchunk):
                         i += 1
                         if not (ord(c) & 0x80):
                             return i
                     return i
                 out = ""
                 s = deltahead(binchunk)
                 binchunk = binchunk[s:]
                 s = deltahead(binchunk)
                 binchunk = binchunk[s:]
                 i = 0
                 while i < len(binchunk):
                     cmd = ord(binchunk[i:i + 1])
                     i += 1
                     if (cmd & 0x80):
                         offset = 0
                         size = 0
                         if (cmd & 0x01):
                             offset = ord(binchunk[i:i + 1])
                             i += 1
                         if (cmd & 0x02):
                             offset |= ord(binchunk[i:i + 1]) << 8
                             i += 1
                         if (cmd & 0x04):
                             offset |= ord(binchunk[i:i + 1]) << 16
                             i += 1
                         if (cmd & 0x08):
                             offset |= ord(binchunk[i:i + 1]) << 24
                             i += 1
                         if (cmd & 0x10):
                             size = ord(binchunk[i:i + 1])
                             i += 1
                         if (cmd & 0x20):
                             size |= ord(binchunk[i:i + 1]) << 8
                             i += 1
                         if (cmd & 0x40):
                             size |= ord(binchunk[i:i + 1]) << 16
                             i += 1
                         if size == 0:
                             size = 0x10000
                         offset_end = offset + size
                         out += data[offset:offset_end]
                     elif cmd != 0:
                         offset_end = i + cmd
                         out += binchunk[i:offset_end]
                         i += cmd
                     else:
                         raise PatchError(_('unexpected delta opcode 0'))
                 return out
             def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
                 """Reads a patch from fp and tries to apply it.
                 Returns 0 for a clean patch, -1 if any rejects were found and 1 if
                 there was any fuzz.
                 If 'eolmode' is 'strict', the patch content and patched file are
                 read in binary mode. Otherwise, line endings are ignored when
                 patching then normalized according to 'eolmode'.
                 """
                 return _applydiff(ui, fp, patchfile, backend, store, strip=strip,
                                   prefix=prefix, eolmode=eolmode)
             def _canonprefix(repo, prefix):
                 if prefix:
                     prefix = pathutil.canonpath(repo.root, repo.getcwd(), prefix)
                     if prefix != '':
                         prefix += '/'
                 return prefix
             def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
                            eolmode='strict'):
                 prefix = _canonprefix(backend.repo, prefix)
                 def pstrip(p):
                     return pathtransform(p, strip - 1, prefix)[1]
                 rejects = 0
                 err = 0
                 current_file = None
                 for state, values in iterhunks(fp):
                     if state == 'hunk':
                         if not current_file:
                             continue
                         ret = current_file.apply(values)
                         if ret > 0:
                             err = 1
                     elif state == 'file':
                         if current_file:
                             rejects += current_file.close()
                             current_file = None
                         afile, bfile, first_hunk, gp = values
                         if gp:
                             gp.path = pstrip(gp.path)
                             if gp.oldpath:
                                 gp.oldpath = pstrip(gp.oldpath)
                         else:
                             gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                                prefix)
                         if gp.op == 'RENAME':
                             backend.unlink(gp.oldpath)
                         if not first_hunk:
                             if gp.op == 'DELETE':
                                 backend.unlink(gp.path)
                                 continue
                             data, mode = None, None
                             if gp.op in ('RENAME', 'COPY'):
                                 data, mode = store.getfile(gp.oldpath)[:2]
                                 if data is None:
                                     # This means that the old path does not exist
                                     raise PatchError(_("source file '%s' does not exist")
                                                        % gp.oldpath)
                             if gp.mode:
                                 mode = gp.mode
                                 if gp.op == 'ADD':
                                     # Added files without content have no hunk and
                                     # must be created
                                     data = ''
                             if data or mode:
                                 if (gp.op in ('ADD', 'RENAME', 'COPY')
                                     and backend.exists(gp.path)):
                                     raise PatchError(_("cannot create %s: destination "
                                                        "already exists") % gp.path)
                                 backend.setfile(gp.path, data, mode, gp.oldpath)
                             continue
                         try:
                             current_file = patcher(ui, gp, backend, store,
                                                    eolmode=eolmode)
                         except PatchError as inst:
                             ui.warn(str(inst) + '\n')
                             current_file = None
                             rejects += 1
                             continue
                     elif state == 'git':
                         for gp in values:
                             path = pstrip(gp.oldpath)
                             data, mode = backend.getfile(path)
                             if data is None:
                                 # The error ignored here will trigger a getfile()
                                 # error in a place more appropriate for error
                                 # handling, and will not interrupt the patching
                                 # process.
                                 pass
                             else:
                                 store.setfile(path, data, mode)
                     else:
                         raise error.Abort(_('unsupported parser state: %s') % state)
                 if current_file:
                     rejects += current_file.close()
                 if rejects:
                     return -1
                 return err
             def _externalpatch(ui, repo, patcher, patchname, strip, files,
                                similarity):
                 """use <patcher> to apply <patchname> to the working directory.
                 returns whether patch was applied with fuzz factor."""
                 fuzz = False
                 args = []
                 cwd = repo.root
                 if cwd:
                     args.append('-d %s' % procutil.shellquote(cwd))
                 cmd = ('%s %s -p%d < %s'
                        % (patcher, ' '.join(args), strip, procutil.shellquote(patchname)))
                 ui.debug('Using external patch tool: %s\n' % cmd)
                 fp = procutil.popen(cmd, 'rb')
                 try:
                     for line in util.iterfile(fp):
                         line = line.rstrip()
                         ui.note(line + '\n')
                         if line.startswith('patching file '):
                             pf = util.parsepatchoutput(line)
                             printed_file = False
                             files.add(pf)
                         elif line.find('with fuzz') >= 0:
                             fuzz = True
                             if not printed_file:
                                 ui.warn(pf + '\n')
                                 printed_file = True
                             ui.warn(line + '\n')
                         elif line.find('saving rejects to file') >= 0:
                             ui.warn(line + '\n')
                         elif line.find('FAILED') >= 0:
                             if not printed_file:
                                 ui.warn(pf + '\n')
                                 printed_file = True
                             ui.warn(line + '\n')
                 finally:
                     if files:
                         scmutil.marktouched(repo, files, similarity)
                 code = fp.close()
                 if code:
                     raise PatchError(_("patch command failed: %s") %
                                      procutil.explainexit(code))
                 return fuzz
             def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                              eolmode='strict'):
                 if files is None:
                     files = set()
                 if eolmode is None:
                     eolmode = ui.config('patch', 'eol')
                 if eolmode.lower() not in eolmodes:
                     raise error.Abort(_('unsupported line endings type: %s') % eolmode)
                 eolmode = eolmode.lower()
                 store = filestore()
                 try:
                     fp = open(patchobj, 'rb')
                 except TypeError:
                     fp = patchobj
                 try:
                     ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,
                                     eolmode=eolmode)
                 finally:
                     if fp != patchobj:
                         fp.close()
                     files.update(backend.close())
                     store.close()
                 if ret < 0:
                     raise PatchError(_('patch failed to apply'))
                 return ret > 0
             def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                               eolmode='strict', similarity=0):
                 """use builtin patch to apply <patchobj> to the working directory.
                 returns whether patch was applied with fuzz factor."""
                 backend = workingbackend(ui, repo, similarity)
                 return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)
             def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
                           eolmode='strict'):
                 backend = repobackend(ui, repo, ctx, store)
                 return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)
             def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
                       similarity=0):
                 """Apply <patchname> to the working directory.
                 'eolmode' specifies how end of lines should be handled. It can be:
                 - 'strict': inputs are read in binary mode, EOLs are preserved
                 - 'crlf': EOLs are ignored when patching and reset to CRLF
                 - 'lf': EOLs are ignored when patching and reset to LF
                 - None: get it from user settings, default to 'strict'
                 'eolmode' is ignored when using an external patcher program.
                 Returns whether patch was applied with fuzz factor.
                 """
                 patcher = ui.config('ui', 'patch')
                 if files is None:
                     files = set()
                 if patcher:
                     return _externalpatch(ui, repo, patcher, patchname, strip,
                                           files, similarity)
                 return internalpatch(ui, repo, patchname, strip, prefix, files, eolmode,
                                      similarity)
             def changedfiles(ui, repo, patchpath, strip=1, prefix=''):
                 backend = fsbackend(ui, repo.root)
                 prefix = _canonprefix(repo, prefix)
                 with open(patchpath, 'rb') as fp:
                     changed = set()
                     for state, values in iterhunks(fp):
                         if state == 'file':
                             afile, bfile, first_hunk, gp = values
                             if gp:
                                 gp.path = pathtransform(gp.path, strip - 1, prefix)[1]
                                 if gp.oldpath:
                                     gp.oldpath = pathtransform(gp.oldpath, strip - 1,
                                                                prefix)[1]
                             else:
                                 gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                                    prefix)
                             changed.add(gp.path)
                             if gp.op == 'RENAME':
                                 changed.add(gp.oldpath)
                         elif state not in ('hunk', 'git'):
                             raise error.Abort(_('unsupported parser state: %s') % state)
                     return changed
             class GitDiffRequired(Exception):
                 pass
             diffopts = diffutil.diffallopts
             diffallopts = diffutil.diffallopts
             difffeatureopts = diffutil.difffeatureopts
             def diff(repo, node1=None, node2=None, match=None, changes=None,
                      opts=None, losedatafn=None, pathfn=None, copy=None,
                      copysourcematch=None, hunksfilterfn=None):
                 '''yields diff of changes to files between two nodes, or node and
                 working directory.
                 if node1 is None, use first dirstate parent instead.
                 if node2 is None, compare node1 with working directory.
                 losedatafn(**kwarg) is a callable run when opts.upgrade=True and
                 every time some change cannot be represented with the current
                 patch format. Return False to upgrade to git patch format, True to
                 accept the loss or raise an exception to abort the diff. It is
                 called with the name of current file being diffed as 'fn'. If set
                 to None, patches will always be upgraded to git format when
                 necessary.
                 prefix is a filename prefix that is prepended to all filenames on
                 display (used for subrepos).
                 relroot, if not empty, must be normalized with a trailing /. Any match
                 patterns that fall outside it will be ignored.
                 copy, if not empty, should contain mappings {dst@y: src@x} of copy
                 information.
                 if copysourcematch is not None, then copy sources will be filtered by this
                 matcher
                 hunksfilterfn, if not None, should be a function taking a filectx and
                 hunks generator that may yield filtered hunks.
                 '''
                 if not node1 and not node2:
                     node1 = repo.dirstate.p1()
                 ctx1 = repo[node1]
                 ctx2 = repo[node2]
                 for fctx1, fctx2, hdr, hunks in diffhunks(
                         repo, ctx1=ctx1, ctx2=ctx2, match=match, changes=changes, opts=opts,
                         losedatafn=losedatafn, pathfn=pathfn, copy=copy,
                         copysourcematch=copysourcematch):
                     if hunksfilterfn is not None:
                         # If the file has been removed, fctx2 is None; but this should
                         # not occur here since we catch removed files early in
                         # logcmdutil.getlinerangerevs() for 'hg log -L'.
                         assert fctx2 is not None, (
                             'fctx2 unexpectly None in diff hunks filtering')
                         hunks = hunksfilterfn(fctx2, hunks)
                     text = ''.join(sum((list(hlines) for hrange, hlines in hunks), []))
                     if hdr and (text or len(hdr) > 1):
                         yield '\n'.join(hdr) + '\n'
                     if text:
                         yield text
             def diffhunks(repo, ctx1, ctx2, match=None, changes=None, opts=None,
                           losedatafn=None, pathfn=None, copy=None, copysourcematch=None):
                 """Yield diff of changes to files in the form of (`header`, `hunks`) tuples
                 where `header` is a list of diff headers and `hunks` is an iterable of
                 (`hunkrange`, `hunklines`) tuples.
                 See diff() for the meaning of parameters.
                 """
                 if opts is None:
                     opts = mdiff.defaultopts
                 def lrugetfilectx():
                     cache = {}
                     order = collections.deque()
                     def getfilectx(f, ctx):
                         fctx = ctx.filectx(f, filelog=cache.get(f))
                         if f not in cache:
                             if len(cache) > 20:
                                 del cache[order.popleft()]
                             cache[f] = fctx.filelog()
                         else:
                             order.remove(f)
                         order.append(f)
                         return fctx
                     return getfilectx
                 getfilectx = lrugetfilectx()
                 if not changes:
                     changes = ctx1.status(ctx2, match=match)
                 modified, added, removed = changes[:3]
                 if not modified and not added and not removed:
                     return []
                 if repo.ui.debugflag:
                     hexfunc = hex
                 else:
                     hexfunc = short
                 revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]
                 if copy is None:
                     copy = {}
                     if opts.git or opts.upgrade:
                         copy = copies.pathcopies(ctx1, ctx2, match=match)
                 if copysourcematch:
                     # filter out copies where source side isn't inside the matcher
                     # (copies.pathcopies() already filtered out the destination)
                     copy = {dst: src for dst, src in copy.iteritems()
                             if copysourcematch(src)}
                 modifiedset = set(modified)
                 addedset = set(added)
                 removedset = set(removed)
                 for f in modified:
                     if f not in ctx1:
                         # Fix up added, since merged-in additions appear as
                         # modifications during merges
                         modifiedset.remove(f)
                         addedset.add(f)
                 for f in removed:
                     if f not in ctx1:
                         # Merged-in additions that are then removed are reported as removed.
                         # They are not in ctx1, so We don't want to show them in the diff.
                         removedset.remove(f)
                 modified = sorted(modifiedset)
                 added = sorted(addedset)
                 removed = sorted(removedset)
                 for dst, src in list(copy.items()):
                     if src not in ctx1:
                         # Files merged in during a merge and then copied/renamed are
                         # reported as copies. We want to show them in the diff as additions.
                         del copy[dst]
                 prefetchmatch = scmutil.matchfiles(
                     repo, list(modifiedset | addedset | removedset))
                 scmutil.prefetchfiles(repo, [ctx1.rev(), ctx2.rev()], prefetchmatch)
                 def difffn(opts, losedata):
                     return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                                    copy, getfilectx, opts, losedata, pathfn)
                 if opts.upgrade and not opts.git:
                     try:
                         def losedata(fn):
                             if not losedatafn or not losedatafn(fn=fn):
                                 raise GitDiffRequired
                         # Buffer the whole output until we are sure it can be generated
                         return list(difffn(opts.copy(git=False), losedata))
                     except GitDiffRequired:
                         return difffn(opts.copy(git=True), None)
                 else:
                     return difffn(opts, None)
             def diffsinglehunk(hunklines):
                 """yield tokens for a list of lines in a single hunk"""
                 for line in hunklines:
                     # chomp
                     chompline = line.rstrip('\r\n')
                     # highlight tabs and trailing whitespace
                     stripline = chompline.rstrip()
                     if line.startswith('-'):
                         label = 'diff.deleted'
                     elif line.startswith('+'):
                         label = 'diff.inserted'
                     else:
                         raise error.ProgrammingError('unexpected hunk line: %s' % line)
                     for token in tabsplitter.findall(stripline):
                         if token.startswith('\t'):
                             yield (token, 'diff.tab')
                         else:
                             yield (token, label)
                     if chompline != stripline:
                         yield (chompline[len(stripline):], 'diff.trailingwhitespace')
                     if chompline != line:
                         yield (line[len(chompline):], '')
             def diffsinglehunkinline(hunklines):
                 """yield tokens for a list of lines in a single hunk, with inline colors"""
                 # prepare deleted, and inserted content
                 a = ''
                 b = ''
                 for line in hunklines:
                     if line[0:1] == '-':
                         a += line[1:]
                     elif line[0:1] == '+':
                         b += line[1:]
                     else:
                         raise error.ProgrammingError('unexpected hunk line: %s' % line)
                 # fast path: if either side is empty, use diffsinglehunk
                 if not a or not b:
                     for t in diffsinglehunk(hunklines):
                         yield t
                     return
                 # re-split the content into words
                 al = wordsplitter.findall(a)
                 bl = wordsplitter.findall(b)
                 # re-arrange the words to lines since the diff algorithm is line-based
                 aln = [s if s == '\n' else s + '\n' for s in al]
                 bln = [s if s == '\n' else s + '\n' for s in bl]
                 an = ''.join(aln)
                 bn = ''.join(bln)
                 # run the diff algorithm, prepare atokens and btokens
                 atokens = []
                 btokens = []
                 blocks = mdiff.allblocks(an, bn, lines1=aln, lines2=bln)
                 for (a1, a2, b1, b2), btype in blocks:
                     changed = btype == '!'
                     for token in mdiff.splitnewlines(''.join(al[a1:a2])):
                         atokens.append((changed, token))
                     for token in mdiff.splitnewlines(''.join(bl[b1:b2])):
                         btokens.append((changed, token))
                 # yield deleted tokens, then inserted ones
                 for prefix, label, tokens in [('-', 'diff.deleted', atokens),
                                               ('+', 'diff.inserted', btokens)]:
                     nextisnewline = True
                     for changed, token in tokens:
                         if nextisnewline:
                             yield (prefix, label)
                             nextisnewline = False
                         # special handling line end
                         isendofline = token.endswith('\n')
                         if isendofline:
                             chomp = token[:-1] # chomp
                             if chomp.endswith('\r'):
                                 chomp = chomp[:-1]
                             endofline = token[len(chomp):]
                             token = chomp.rstrip() # detect spaces at the end
                             endspaces = chomp[len(token):]
                         # scan tabs
                         for maybetab in tabsplitter.findall(token):
                             if b'\t' == maybetab[0:1]:
                                 currentlabel = 'diff.tab'
                             else:
                                 if changed:
                                     currentlabel = label + '.changed'
                                 else:
                                     currentlabel = label + '.unchanged'
                             yield (maybetab, currentlabel)
                         if isendofline:
                             if endspaces:
                                 yield (endspaces, 'diff.trailingwhitespace')
                             yield (endofline, '')
                             nextisnewline = True
             def difflabel(func, *args, **kw):
                 '''yields 2-tuples of (output, label) based on the output of func()'''
                 if kw.get(r'opts') and kw[r'opts'].worddiff:
                     dodiffhunk = diffsinglehunkinline
                 else:
                     dodiffhunk = diffsinglehunk
                 headprefixes = [('diff', 'diff.diffline'),
                                 ('copy', 'diff.extended'),
                                 ('rename', 'diff.extended'),
                                 ('old', 'diff.extended'),
                                 ('new', 'diff.extended'),
                                 ('deleted', 'diff.extended'),
                                 ('index', 'diff.extended'),
                                 ('similarity', 'diff.extended'),
                                 ('---', 'diff.file_a'),
                                 ('+++', 'diff.file_b')]
                 textprefixes = [('@', 'diff.hunk'),
                                 # - and + are handled by diffsinglehunk
                                ]
                 head = False
                 # buffers a hunk, i.e. adjacent "-", "+" lines without other changes.
                 hunkbuffer = []
                 def consumehunkbuffer():
                     if hunkbuffer:
                         for token in dodiffhunk(hunkbuffer):
                             yield token
                         hunkbuffer[:] = []
                 for chunk in func(*args, **kw):
                     lines = chunk.split('\n')
                     linecount = len(lines)
                     for i, line in enumerate(lines):
                         if head:
                             if line.startswith('@'):
                                 head = False
                         else:
                             if line and not line.startswith((' ', '+', '-', '@', '\\')):
                                 head = True
                         diffline = False
                         if not head and line and line.startswith(('+', '-')):
                             diffline = True
                         prefixes = textprefixes
                         if head:
                             prefixes = headprefixes
                         if diffline:
                             # buffered
                             bufferedline = line
                             if i + 1 < linecount:
                                 bufferedline += "\n"
                             hunkbuffer.append(bufferedline)
                         else:
                             # unbuffered
                             for token in consumehunkbuffer():
                                 yield token
                             stripline = line.rstrip()
                             for prefix, label in prefixes:
                                 if stripline.startswith(prefix):
                                     yield (stripline, label)
                                     if line != stripline:
                                         yield (line[len(stripline):],
                                                'diff.trailingwhitespace')
                                     break
                             else:
                                 yield (line, '')
                             if i + 1 < linecount:
                                 yield ('\n', '')
                     for token in consumehunkbuffer():
                         yield token
             def diffui(*args, **kw):
                 '''like diff(), but yields 2-tuples of (output, label) for ui.write()'''
                 return difflabel(diff, *args, **kw)
             def _filepairs(modified, added, removed, copy, opts):
                 '''generates tuples (f1, f2, copyop), where f1 is the name of the file
                 before and f2 is the the name after. For added files, f1 will be None,
                 and for removed files, f2 will be None. copyop may be set to None, 'copy'
                 or 'rename' (the latter two only if opts.git is set).'''
                 gone = set()
                 copyto = dict([(v, k) for k, v in copy.items()])
                 addedset, removedset = set(added), set(removed)
                 for f in sorted(modified + added + removed):
                     copyop = None
                     f1, f2 = f, f
                     if f in addedset:
                         f1 = None
                         if f in copy:
                             if opts.git:
                                 f1 = copy[f]
                                 if f1 in removedset and f1 not in gone:
                                     copyop = 'rename'
                                     gone.add(f1)
                                 else:
                                     copyop = 'copy'
                     elif f in removedset:
                         f2 = None
                         if opts.git:
                             # have we already reported a copy above?
                             if (f in copyto and copyto[f] in addedset
                                 and copy[copyto[f]] == f):
                                 continue
                     yield f1, f2, copyop
             def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                         copy, getfilectx, opts, losedatafn, pathfn):
                 '''given input data, generate a diff and yield it in blocks
                 If generating a diff would lose data like flags or binary data and
                 losedatafn is not None, it will be called.
                 pathfn is applied to every path in the diff output.
                 '''
                 def gitindex(text):
                     if not text:
                         text = ""
                     l = len(text)
                     s = hashlib.sha1('blob %d\0' % l)
                     s.update(text)
                     return hex(s.digest())
                 if opts.noprefix:
                     aprefix = bprefix = ''
                 else:
                     aprefix = 'a/'
                     bprefix = 'b/'
                 def diffline(f, revs):
                     revinfo = ' '.join(["-r %s" % rev for rev in revs])
                     return 'diff %s %s' % (revinfo, f)
                 def isempty(fctx):
                     return fctx is None or fctx.size() == 0
                 date1 = dateutil.datestr(ctx1.date())
                 date2 = dateutil.datestr(ctx2.date())
                 gitmode = {'l': '120000', 'x': '100755', '': '100644'}
                 if not pathfn:
                     pathfn = lambda f: f
                 for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
                     content1 = None
                     content2 = None
                     fctx1 = None
                     fctx2 = None
                     flag1 = None
                     flag2 = None
                     if f1:
                         fctx1 = getfilectx(f1, ctx1)
                         if opts.git or losedatafn:
                             flag1 = ctx1.flags(f1)
                     if f2:
                         fctx2 = getfilectx(f2, ctx2)
                         if opts.git or losedatafn:
                             flag2 = ctx2.flags(f2)
                     # if binary is True, output "summary" or "base85", but not "text diff"
                     if opts.text:
                         binary = False
                     else:
                         binary = any(f.isbinary() for f in [fctx1, fctx2] if f is not None)
                     if losedatafn and not opts.git:
                         if (binary or
                             # copy/rename
                             f2 in copy or
                             # empty file creation
                             (not f1 and isempty(fctx2)) or
                             # empty file deletion
                             (isempty(fctx1) and not f2) or
                             # create with flags
                             (not f1 and flag2) or
                             # change flags
                             (f1 and f2 and flag1 != flag2)):
                             losedatafn(f2 or f1)
                     path1 = pathfn(f1 or f2)
                     path2 = pathfn(f2 or f1)
                     header = []
                     if opts.git:
                         header.append('diff --git %s%s %s%s' %
                                       (aprefix, path1, bprefix, path2))
                         if not f1: # added
                             header.append('new file mode %s' % gitmode[flag2])
                         elif not f2: # removed
                             header.append('deleted file mode %s' % gitmode[flag1])
                         else:  # modified/copied/renamed
                             mode1, mode2 = gitmode[flag1], gitmode[flag2]
                             if mode1 != mode2:
                                 header.append('old mode %s' % mode1)
                                 header.append('new mode %s' % mode2)
                             if copyop is not None:
                                 if opts.showsimilarity:
                                     sim = similar.score(ctx1[path1], ctx2[path2]) * 100
                                     header.append('similarity index %d%%' % sim)
                                 header.append('%s from %s' % (copyop, path1))
                                 header.append('%s to %s' % (copyop, path2))
                     elif revs:
                         header.append(diffline(path1, revs))
                     #  fctx.is  | diffopts                | what to   | is fctx.data()
                     #  binary() | text nobinary git index | output?   | outputted?
                     # ------------------------------------|----------------------------
                     #  yes      | no   no       no  *     | summary   | no
                     #  yes      | no   no       yes *     | base85    | yes
                     #  yes      | no   yes      no  *     | summary   | no
                     #  yes      | no   yes      yes 0     | summary   | no
                     #  yes      | no   yes      yes >0    | summary   | semi [1]
                     #  yes      | yes  *        *   *     | text diff | yes
                     #  no       | *    *        *   *     | text diff | yes
                     # [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked
                     if binary and (not opts.git or (opts.git and opts.nobinary and not
                                                     opts.index)):
                         # fast path: no binary content will be displayed, content1 and
                         # content2 are only used for equivalent test. cmp() could have a
                         # fast path.
                         if fctx1 is not None:
                             content1 = b'\0'
                         if fctx2 is not None:
                             if fctx1 is not None and not fctx1.cmp(fctx2):
                                 content2 = b'\0' # not different
                             else:
                                 content2 = b'\0\0'
                     else:
                         # normal path: load contents
                         if fctx1 is not None:
                             content1 = fctx1.data()
                         if fctx2 is not None:
                             content2 = fctx2.data()
                     if binary and opts.git and not opts.nobinary:
                         text = mdiff.b85diff(content1, content2)
                         if text:
                             header.append('index %s..%s' %
                                           (gitindex(content1), gitindex(content2)))
                         hunks = (None, [text]),
                     else:
                         if opts.git and opts.index > 0:
                             flag = flag1
                             if flag is None:
                                 flag = flag2
                             header.append('index %s..%s %s' %
                                           (gitindex(content1)[0:opts.index],
                                            gitindex(content2)[0:opts.index],
                                            gitmode[flag]))
                         uheaders, hunks = mdiff.unidiff(content1, date1,
                                                         content2, date2,
                                                         path1, path2,
                                                         binary=binary, opts=opts)
                         header.extend(uheaders)
                     yield fctx1, fctx2, header, hunks
             def diffstatsum(stats):
                 maxfile, maxtotal, addtotal, removetotal, binary = 0, 0, 0, 0, False
                 for f, a, r, b in stats:
                     maxfile = max(maxfile, encoding.colwidth(f))
                     maxtotal = max(maxtotal, a + r)
                     addtotal += a
                     removetotal += r
                     binary = binary or b
                 return maxfile, maxtotal, addtotal, removetotal, binary
             def diffstatdata(lines):
                 diffre = re.compile(br'^diff .*-r [a-z0-9]+\s(.*)$')
                 results = []
                 filename, adds, removes, isbinary = None, 0, 0, False
                 def addresult():
                     if filename:
                         results.append((filename, adds, removes, isbinary))
                 # inheader is used to track if a line is in the
                 # header portion of the diff.  This helps properly account
                 # for lines that start with '--' or '++'
                 inheader = False
                 for line in lines:
                     if line.startswith('diff'):
                         addresult()
                         # starting a new file diff
                         # set numbers to 0 and reset inheader
                         inheader = True
                         adds, removes, isbinary = 0, 0, False
                         if line.startswith('diff --git a/'):
                             filename = gitre.search(line).group(2)
                         elif line.startswith('diff -r'):
                             # format: "diff -r ... -r ... filename"
                             filename = diffre.search(line).group(1)
                     elif line.startswith('@@'):
                         inheader = False
                     elif line.startswith('+') and not inheader:
                         adds += 1
                     elif line.startswith('-') and not inheader:
                         removes += 1
                     elif (line.startswith('GIT binary patch') or
                           line.startswith('Binary file')):
                         isbinary = True
                     elif line.startswith('rename from'):
                         filename = line[12:]
                     elif line.startswith('rename to'):
                         filename += ' => %s' % line[10:]
                 addresult()
                 return results
             def diffstat(lines, width=80):
                 output = []
                 stats = diffstatdata(lines)
                 maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)
                 countwidth = len(str(maxtotal))
                 if hasbinary and countwidth < 3:
                     countwidth = 3
                 graphwidth = width - countwidth - maxname - 6
                 if graphwidth < 10:
                     graphwidth = 10
                 def scale(i):
                     if maxtotal <= graphwidth:
                         return i
                     # If diffstat runs out of room it doesn't print anything,
                     # which isn't very useful, so always print at least one + or -
                     # if there were at least some changes.
                     return max(i * graphwidth // maxtotal, int(bool(i)))
                 for filename, adds, removes, isbinary in stats:
                     if isbinary:
                         count = 'Bin'
                     else:
                         count = '%d' % (adds + removes)
                     pluses = '+' * scale(adds)
                     minuses = '-' * scale(removes)
                     output.append(' %s%s |  %*s %s%s\n' %
                                   (filename, ' ' * (maxname - encoding.colwidth(filename)),
                                    countwidth, count, pluses, minuses))
                 if stats:
                     output.append(_(' %d files changed, %d insertions(+), '
                                     '%d deletions(-)\n')
                                   % (len(stats), totaladds, totalremoves))
                 return ''.join(output)
             def diffstatui(*args, **kw):
                 '''like diffstat(), but yields 2-tuples of (output, label) for
                 ui.write()
                 '''
                 for line in diffstat(*args, **kw).splitlines():
                     if line and line[-1] in '+-':
                         name, graph = line.rsplit(' ', 1)
                         yield (name + ' ', '')
                         m = re.search(br'\++', graph)
                         if m:
                             yield (m.group(0), 'diffstat.inserted')
                         m = re.search(br'-+', graph)
                         if m:
                             yield (m.group(0), 'diffstat.deleted')
                     else:
                         yield (line, '')
                     yield ('\n', '')