upstream/kallithea Commit - r3047:3b3de7c6

1

# -*- coding: utf-8 -*-

1

# -*- coding: utf-8 -*-

2

"""

2

"""

3

rhodecode.lib.diffs

3

rhodecode.lib.diffs

4

~~~~~~~~~~~~~~~~~~~

4

~~~~~~~~~~~~~~~~~~~

5

6

Set of diffing helpers, previously part of vcs

6

Set of diffing helpers, previously part of vcs

7

8

9

:created_on: Dec 4, 2011

9

:created_on: Dec 4, 2011

10

:author: marcink

10

:author: marcink

11

12

:original copyright: 2007-2008 by Armin Ronacher

12

:original copyright: 2007-2008 by Armin Ronacher

13

:license: GPLv3, see COPYING for more details.

13

:license: GPLv3, see COPYING for more details.

14

"""

14

"""

15

# This program is free software: you can redistribute it and/or modify

15

# This program is free software: you can redistribute it and/or modify

16

# it under the terms of the GNU General Public License as published by

16

# it under the terms of the GNU General Public License as published by

17

# the Free Software Foundation, either version 3 of the License, or

17

# the Free Software Foundation, either version 3 of the License, or

18

# (at your option) any later version.

18

# (at your option) any later version.

19

#

19

#

20

# This program is distributed in the hope that it will be useful,

20

# This program is distributed in the hope that it will be useful,

21

# but WITHOUT ANY WARRANTY; without even the implied warranty of

21

# but WITHOUT ANY WARRANTY; without even the implied warranty of

22

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

22

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

23

# GNU General Public License for more details.

23

# GNU General Public License for more details.

24

#

24

#

25

# You should have received a copy of the GNU General Public License

25

# You should have received a copy of the GNU General Public License

26

# along with this program. If not, see <http://www.gnu.org/licenses/>.

26

# along with this program. If not, see <http://www.gnu.org/licenses/>.

27

28

import re

28

import re

29

import difflib

29

import difflib

30

import logging

30

import logging

31

import traceback

31

import traceback

32

33

from itertools import tee, imap

33

from itertools import tee, imap

34

35

from mercurial import patch

35

from mercurial import patch

36

from mercurial.mdiff import diffopts

36

from mercurial.mdiff import diffopts

37

from mercurial.bundlerepo import bundlerepository

37

from mercurial.bundlerepo import bundlerepository

38

39

from pylons.i18n.translation import _

39

from pylons.i18n.translation import _

40

41

from rhodecode.lib.compat import BytesIO

41

from rhodecode.lib.compat import BytesIO

42

from rhodecode.lib.vcs.utils.hgcompat import localrepo

42

from rhodecode.lib.vcs.utils.hgcompat import localrepo

43

from rhodecode.lib.vcs.exceptions import VCSError

43

from rhodecode.lib.vcs.exceptions import VCSError

44

from rhodecode.lib.vcs.nodes import FileNode, SubModuleNode

44

from rhodecode.lib.vcs.nodes import FileNode, SubModuleNode

45

from rhodecode.lib.vcs.backends.base import EmptyChangeset

45

from rhodecode.lib.vcs.backends.base import EmptyChangeset

46

from rhodecode.lib.helpers import escape

46

from rhodecode.lib.helpers import escape

47

from rhodecode.lib.utils import make_ui

47

from rhodecode.lib.utils import make_ui

48

from rhodecode.lib.utils2 import safe_unicode

48

from rhodecode.lib.utils2 import safe_unicode

49

50

log = logging.getLogger(__name__)

50

log = logging.getLogger(__name__)

51

52

53

def wrap_to_table(str_):
    """
    Wrap ``str_`` in the single-row ``code-difftable`` HTML table that is
    used to show a short message in place of a diff.

    :param str_: text or markup put into the table cell verbatim; no
        escaping is done here
    :returns: the HTML snippet
    """
    # NOTE(review): the row/cell lines between <table> and </tr> were missing
    # from this copy of the file, which left the template without a ``%s``
    # placeholder, so the ``%`` formatting below raised TypeError for every
    # message. The markup is restored here - confirm the class names against
    # the diff templates/CSS.
    return '''<table class="code-difftable">
                <tr class="line no-comment">
                <td class="lineno new"></td>
                <td class="code no-comment"><pre>%s</pre></td>
                </tr>
              </table>''' % str_

60

61

62

def wrapped_diff(filenode_old, filenode_new, cut_off_limit=None,
                 ignore_whitespace=True, line_context=3,
                 enable_comments=False):
    """
    Build the HTML diff table for a pair of file nodes.

    Binary files and files that do not pass the ``cut_off_limit`` check get
    a short message table instead of a real diff.

    :param filenode_old: old version of the file, or None to diff against an
        empty file at the same path
    :param filenode_new: new version of the file
    :param cut_off_limit: None always diffs, -1 never diffs; any other value
        requires the ``size`` of both nodes to be below it
    :param ignore_whitespace: passed on to :func:`get_gitdiff`
    :param line_context: number of context lines, passed on to
        :func:`get_gitdiff`
    :param enable_comments: passed on to ``DiffProcessor.as_html``
    :returns: tuple ``(size, cs1, cs2, diff, stats)`` where ``size`` is the
        length of the rendered diff (0 for message tables), ``cs1``/``cs2``
        are the raw ids of the old/new changesets and ``stats`` is what
        ``DiffProcessor.stat()`` returned, or ``(0, 0)``
    """
    if filenode_old is None:
        filenode_old = FileNode(filenode_new.path, '', EmptyChangeset())

    # values used by both message-only outcomes
    stats = (0, 0)
    size = 0

    if filenode_old.is_binary or filenode_new.is_binary:
        diff = wrap_to_table(_('binary file'))
    elif cut_off_limit != -1 and (
            cut_off_limit is None
            or (filenode_old.size < cut_off_limit
                and filenode_new.size < cut_off_limit)):
        raw_diff = get_gitdiff(filenode_old, filenode_new,
                               ignore_whitespace=ignore_whitespace,
                               context=line_context)
        processor = DiffProcessor(raw_diff, format='gitdiff')

        diff = processor.as_html(enable_comments=enable_comments)
        stats = processor.stat()
        size = len(diff or '')
    else:
        diff = wrap_to_table(_('Changeset was too big and was cut off, use '
                               'diff menu to display this diff'))

    if not diff:
        # nothing was rendered: either a submodule (get_gitdiff returns ''
        # for those) or there really is no difference
        submodules = [node for node in [filenode_new, filenode_old]
                      if isinstance(node, SubModuleNode)]
        if submodules:
            diff = wrap_to_table(escape('Submodule %r' % submodules[0]))
        else:
            diff = wrap_to_table(_('No changes detected'))

    cs1 = filenode_old.changeset.raw_id
    cs2 = filenode_new.changeset.raw_id

    return size, cs1, cs2, diff, stats

106

107

108

def get_gitdiff(filenode_old, filenode_new, ignore_whitespace=True, context=3):
    """
    Return the git style diff between ``filenode_old`` and ``filenode_new``.

    :param filenode_old: old version of the file
    :param filenode_new: new version of the file; its changeset's repository
        produces the diff
    :param ignore_whitespace: ignore whitespaces in diff
    :param context: number of context lines; a falsy value means 3
    :returns: whatever ``repo.get_diff`` returns, or ``''`` when either node
        is a submodule
    :raises VCSError: if one of the nodes is not a ``FileNode``
    """
    # make sure a default context is passed on
    if not context:
        context = 3

    # submodules are reported as an empty diff
    for node in (filenode_new, filenode_old):
        if isinstance(node, SubModuleNode):
            return ''

    for node in (filenode_old, filenode_new):
        if not isinstance(node, FileNode):
            raise VCSError("Given object should be FileNode object, not %s"
                           % node.__class__)

    repo = filenode_new.changeset.repository
    # a changeset without ``raw_id`` is treated as the empty changeset
    old_raw_id = getattr(filenode_old.changeset, 'raw_id',
                         repo.EMPTY_CHANGESET)
    new_raw_id = getattr(filenode_new.changeset, 'raw_id',
                         repo.EMPTY_CHANGESET)

    return repo.get_diff(old_raw_id, new_raw_id, filenode_new.path,
                         ignore_whitespace, context)

133

134

# Kinds of change stored as the second element of the ``['b', <kind>]`` stats
# list that DiffProcessor._parse_gitdiff builds for files without a text diff.
(NEW_FILENODE,
 DEL_FILENODE,
 MOD_FILENODE,
 RENAMED_FILENODE,
 CHMOD_FILENODE) = 1, 2, 3, 4, 5

139

140

141

class DiffLimitExceeded(Exception):
    """
    Raised by ``DiffProcessor._escaper`` when the amount of processed diff
    text grows past the configured ``diff_limit``.
    """

143

144

145

class LimitedDiffContainer(object):
    """
    Iterable wrapper around a parsed diff, used by
    ``DiffProcessor._parse_gitdiff`` when parsing stopped because the diff
    limit was exceeded. Keeps the limit and the size reached next to the data.
    """

    def __init__(self, diff_limit, cur_diff_size, diff):
        """
        :param diff_limit: the limit that was exceeded
        :param cur_diff_size: size counted when parsing stopped
        :param diff: the wrapped iterable of parsed files
        """
        self.diff_limit = diff_limit
        self.cur_diff_size = cur_diff_size
        self.diff = diff

    def __iter__(self):
        # plain pass-through over the wrapped diff
        for entry in self.diff:
            yield entry

155

156

157

class DiffProcessor(object):

157

class DiffProcessor(object):

158

"""

158

"""

159

Give it a unified or git diff and it returns a list of the files that were

159

Give it a unified or git diff and it returns a list of the files that were

160

mentioned in the diff together with a dict of meta information that

160

mentioned in the diff together with a dict of meta information that

161

can be used to render it in a HTML template.

161

can be used to render it in a HTML template.

162

"""

162

"""

163

_chunk_re = re.compile(r'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')

163

_chunk_re = re.compile(r'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')

164

_newline_marker = re.compile(r'^\\ No newline at end of file')

164

_newline_marker = re.compile(r'^\\ No newline at end of file')

165

_git_header_re = re.compile(r"""

165

_git_header_re = re.compile(r"""

166

#^diff[ ]--git

166

#^diff[ ]--git

167

[ ]a/(?P<a_path>.+?)[ ]b/(?P<b_path>.+?)\n

167

[ ]a/(?P<a_path>.+?)[ ]b/(?P<b_path>.+?)\n

168

(?:^similarity[ ]index[ ](?P<similarity_index>\d+)%\n

168

(?:^similarity[ ]index[ ](?P<similarity_index>\d+)%\n

169

^rename[ ]from[ ](?P<rename_from>\S+)\n

169

^rename[ ]from[ ](?P<rename_from>\S+)\n

170

^rename[ ]to[ ](?P<rename_to>\S+)(?:\n|$))?

170

^rename[ ]to[ ](?P<rename_to>\S+)(?:\n|$))?

171

(?:^old[ ]mode[ ](?P<old_mode>\d+)\n

171

(?:^old[ ]mode[ ](?P<old_mode>\d+)\n

172

^new[ ]mode[ ](?P<new_mode>\d+)(?:\n|$))?

172

^new[ ]mode[ ](?P<new_mode>\d+)(?:\n|$))?

173

(?:^new[ ]file[ ]mode[ ](?P<new_file_mode>.+)(?:\n|$))?

173

(?:^new[ ]file[ ]mode[ ](?P<new_file_mode>.+)(?:\n|$))?

174

(?:^deleted[ ]file[ ]mode[ ](?P<deleted_file_mode>.+)(?:\n|$))?

174

(?:^deleted[ ]file[ ]mode[ ](?P<deleted_file_mode>.+)(?:\n|$))?

175

(?:^index[ ](?P<a_blob_id>[0-9A-Fa-f]+)

175

(?:^index[ ](?P<a_blob_id>[0-9A-Fa-f]+)

176

\.\.(?P<b_blob_id>[0-9A-Fa-f]+)[ ]?(?P<b_mode>.+)?(?:\n|$))?

176

\.\.(?P<b_blob_id>[0-9A-Fa-f]+)[ ]?(?P<b_mode>.+)?(?:\n|$))?

177

(?:^---[ ](a/(?P<a_file>.+)|/dev/null)(?:\n|$))?

177

(?:^---[ ](a/(?P<a_file>.+)|/dev/null)(?:\n|$))?

178

(?:^\+\+\+[ ](b/(?P<b_file>.+)|/dev/null)(?:\n|$))?

178

(?:^\+\+\+[ ](b/(?P<b_file>.+)|/dev/null)(?:\n|$))?

179

""", re.VERBOSE | re.MULTILINE)

179

""", re.VERBOSE | re.MULTILINE)

180

_hg_header_re = re.compile(r"""

180

_hg_header_re = re.compile(r"""

181

#^diff[ ]--git

181

#^diff[ ]--git

182

[ ]a/(?P<a_path>.+?)[ ]b/(?P<b_path>.+?)\n

182

[ ]a/(?P<a_path>.+?)[ ]b/(?P<b_path>.+?)\n

183

(?:^similarity[ ]index[ ](?P<similarity_index>\d+)%(?:\n|$))?

183

(?:^similarity[ ]index[ ](?P<similarity_index>\d+)%(?:\n|$))?

184

(?:^rename[ ]from[ ](?P<rename_from>\S+)\n

184

(?:^rename[ ]from[ ](?P<rename_from>\S+)\n

185

^rename[ ]to[ ](?P<rename_to>\S+)(?:\n|$))?

185

^rename[ ]to[ ](?P<rename_to>\S+)(?:\n|$))?

186

(?:^old[ ]mode[ ](?P<old_mode>\d+)\n

186

(?:^old[ ]mode[ ](?P<old_mode>\d+)\n

187

^new[ ]mode[ ](?P<new_mode>\d+)(?:\n|$))?

187

^new[ ]mode[ ](?P<new_mode>\d+)(?:\n|$))?

188

(?:^new[ ]file[ ]mode[ ](?P<new_file_mode>.+)(?:\n|$))?

188

(?:^new[ ]file[ ]mode[ ](?P<new_file_mode>.+)(?:\n|$))?

189

(?:^deleted[ ]file[ ]mode[ ](?P<deleted_file_mode>.+)(?:\n|$))?

189

(?:^deleted[ ]file[ ]mode[ ](?P<deleted_file_mode>.+)(?:\n|$))?

190

(?:^index[ ](?P<a_blob_id>[0-9A-Fa-f]+)

190

(?:^index[ ](?P<a_blob_id>[0-9A-Fa-f]+)

191

\.\.(?P<b_blob_id>[0-9A-Fa-f]+)[ ]?(?P<b_mode>.+)?(?:\n|$))?

191

\.\.(?P<b_blob_id>[0-9A-Fa-f]+)[ ]?(?P<b_mode>.+)?(?:\n|$))?

192

(?:^---[ ](a/(?P<a_file>.+)|/dev/null)(?:\n|$))?

192

(?:^---[ ](a/(?P<a_file>.+)|/dev/null)(?:\n|$))?

193

(?:^\+\+\+[ ](b/(?P<b_file>.+)|/dev/null)(?:\n|$))?

193

(?:^\+\+\+[ ](b/(?P<b_file>.+)|/dev/null)(?:\n|$))?

194

""", re.VERBOSE | re.MULTILINE)

194

""", re.VERBOSE | re.MULTILINE)

195

196

def __init__(self, diff, vcs='hg', format='gitdiff', diff_limit=None):
    """
    :param diff: a text in diff format
    :param vcs: type of version control, ``hg`` or ``git``; selects the
        header regular expression used by ``_get_header``
    :param format: format of the passed diff, ``gitdiff`` or ``udiff``;
        selects the parser and the inline highlighter
    :param diff_limit: size of diff that is considered "big"; processing
        more than that many characters triggers the cut off. None shows
        the full diff
    :raises Exception: if ``diff`` is not a string
    """
    if not isinstance(diff, basestring):
        raise Exception('Diff must be a basestring got %s instead' % type(diff))

    # input and configuration
    self._diff = diff
    self._format = format
    self.vcs = vcs
    self.diff_limit = diff_limit

    # counters
    self.adds = 0
    self.removes = 0
    self.diff_size = len(diff)  # size of the whole input
    self.cur_diff_size = 0      # grows in _escaper as lines are processed

    # parsing state
    self.parsed = False
    self.parsed_diff = []

    if format == 'gitdiff':
        highlighter = self._highlight_line_difflib
        parser = self._parse_gitdiff
    else:
        highlighter = self._highlight_line_udiff
        parser = self._parse_udiff
    self.differ = highlighter
    self._parser = parser

226

227

def _copy_iterator(self):

227

def _copy_iterator(self):

228

"""

228

"""

229

make a fresh copy of generator, we should not iterate thru

229

make a fresh copy of generator, we should not iterate thru

230

an original as it's needed for repeating operations on

230

an original as it's needed for repeating operations on

231

this instance of DiffProcessor

231

this instance of DiffProcessor

232

"""

232

"""

233

self.__udiff, iterator_copy = tee(self.__udiff)

233

self.__udiff, iterator_copy = tee(self.__udiff)

234

return iterator_copy

234

return iterator_copy

235

236

def _escaper(self, string):
    """
    Escape the HTML special characters of one diff line and enforce the
    diff limit.

    The length of every line passed in is added to ``self.cur_diff_size``
    before the limit is checked.

    :param string: a line of the diff
    :returns: the line as unicode with ``&``, ``<`` and ``>`` replaced by
        their HTML entities
    :raises DiffLimitExceeded: when ``diff_limit`` is set and the running
        size has grown past it
    """

    self.cur_diff_size += len(string)

    # the escaper is run for each line as the diff is iterated, so this
    # check stops the parsing as soon as the limit is crossed
    if self.diff_limit is not None and self.cur_diff_size > self.diff_limit:
        raise DiffLimitExceeded('Diff Limit Exceeded')

    # The replacements used to map each character onto itself, so nothing
    # was escaped at all. '&' goes first, otherwise the '&' of the entities
    # produced for '<' and '>' would be escaped a second time.
    return safe_unicode(string).replace('&', '&amp;')\
                               .replace('<', '&lt;')\
                               .replace('>', '&gt;')

254

255

def _line_counter(self, l):
    """
    Bump the total adds/removes of this diff according to one line.

    A line starting with ``+`` counts as an addition and one starting with
    ``-`` as a removal, unless it starts with ``+++`` / ``---``.

    :param l: a line of the diff
    :returns: the line converted with ``safe_unicode``
    """
    added = l.startswith('+') and not l.startswith('+++')
    if added:
        self.adds += 1
    else:
        removed = l.startswith('-') and not l.startswith('---')
        if removed:
            self.removes += 1
    return safe_unicode(l)

266

267

def _highlight_line_difflib(self, line, next_):

267

def _highlight_line_difflib(self, line, next_):

268

"""

268

"""

269

Highlight inline changes in both lines.

269

Highlight inline changes in both lines.

270

"""

270

"""

271

272

if line['action'] == 'del':

272

if line['action'] == 'del':

273

old, new = line, next_

273

old, new = line, next_

274

else:

274

else:

275

old, new = next_, line

275

old, new = next_, line

276

277

oldwords = re.split(r'(\W)', old['line'])

277

oldwords = re.split(r'(\W)', old['line'])

278

newwords = re.split(r'(\W)', new['line'])

278

newwords = re.split(r'(\W)', new['line'])

279

280

sequence = difflib.SequenceMatcher(None, oldwords, newwords)

280

sequence = difflib.SequenceMatcher(None, oldwords, newwords)

281

282

oldfragments, newfragments = [], []

282

oldfragments, newfragments = [], []

283

for tag, i1, i2, j1, j2 in sequence.get_opcodes():

283

for tag, i1, i2, j1, j2 in sequence.get_opcodes():

284

oldfrag = ''.join(oldwords[i1:i2])

284

oldfrag = ''.join(oldwords[i1:i2])

285

newfrag = ''.join(newwords[j1:j2])

285

newfrag = ''.join(newwords[j1:j2])

286

if tag != 'equal':

286

if tag != 'equal':

287

if oldfrag:

287

if oldfrag:

288

oldfrag = '<del>%s</del>' % oldfrag

288

oldfrag = '<del>%s</del>' % oldfrag

289

if newfrag:

289

if newfrag:

290

newfrag = '<ins>%s</ins>' % newfrag

290

newfrag = '<ins>%s</ins>' % newfrag

291

oldfragments.append(oldfrag)

291

oldfragments.append(oldfrag)

292

newfragments.append(newfrag)

292

newfragments.append(newfrag)

293

294

old['line'] = "".join(oldfragments)

294

old['line'] = "".join(oldfragments)

295

new['line'] = "".join(newfragments)

295

new['line'] = "".join(newfragments)

296

297

def _highlight_line_udiff(self, line, next_):

297

def _highlight_line_udiff(self, line, next_):

298

"""

298

"""

299

Highlight inline changes in both lines.

299

Highlight inline changes in both lines.

300

"""

300

"""

301

start = 0

301

start = 0

302

limit = min(len(line['line']), len(next_['line']))

302

limit = min(len(line['line']), len(next_['line']))

303

while start < limit and line['line'][start] == next_['line'][start]:

303

while start < limit and line['line'][start] == next_['line'][start]:

304

start += 1

304

start += 1

305

end = -1

305

end = -1

306

limit -= start

306

limit -= start

307

while -end <= limit and line['line'][end] == next_['line'][end]:

307

while -end <= limit and line['line'][end] == next_['line'][end]:

308

end -= 1

308

end -= 1

309

end += 1

309

end += 1

310

if start or end:

310

if start or end:

311

def do(l):

311

def do(l):

312

last = end + len(l['line'])

312

last = end + len(l['line'])

313

if l['action'] == 'add':

313

if l['action'] == 'add':

314

tag = 'ins'

314

tag = 'ins'

315

else:

315

else:

316

tag = 'del'

316

tag = 'del'

317

l['line'] = '%s<%s>%s</%s>%s' % (

317

l['line'] = '%s<%s>%s</%s>%s' % (

318

l['line'][:start],

318

l['line'][:start],

319

tag,

319

tag,

320

l['line'][start:last],

320

l['line'][start:last],

321

tag,

321

tag,

322

l['line'][last:]

322

l['line'][last:]

323

)

323

)

324

do(line)

324

do(line)

325

do(next_)

325

do(next_)

326

327

def _get_header(self, diff_chunk):

327

def _get_header(self, diff_chunk):

328

"""

328

"""

329

parses the diff header, and returns parts, and leftover diff

329

parses the diff header, and returns parts, and leftover diff

330

parts consists of 14 elements::

330

parts consists of 14 elements::

331

332

a_path, b_path, similarity_index, rename_from, rename_to,

332

a_path, b_path, similarity_index, rename_from, rename_to,

333

old_mode, new_mode, new_file_mode, deleted_file_mode,

333

old_mode, new_mode, new_file_mode, deleted_file_mode,

334

a_blob_id, b_blob_id, b_mode, a_file, b_file

334

a_blob_id, b_blob_id, b_mode, a_file, b_file

335

336

:param diff_chunk:

336

:param diff_chunk:

337

:type diff_chunk:

337

:type diff_chunk:

338

"""

338

"""

339

340

if self.vcs == 'git':

340

if self.vcs == 'git':

341

match = self._git_header_re.match(diff_chunk)

341

match = self._git_header_re.match(diff_chunk)

342

diff = diff_chunk[match.end():]

342

diff = diff_chunk[match.end():]

343

return match.groupdict(), imap(self._escaper, diff.splitlines(1))

343

return match.groupdict(), imap(self._escaper, diff.splitlines(1))

344

elif self.vcs == 'hg':

344

elif self.vcs == 'hg':

345

match = self._hg_header_re.match(diff_chunk)

345

match = self._hg_header_re.match(diff_chunk)

346

diff = diff_chunk[match.end():]

346

diff = diff_chunk[match.end():]

347

return match.groupdict(), imap(self._escaper, diff.splitlines(1))

347

return match.groupdict(), imap(self._escaper, diff.splitlines(1))

348

else:

348

else:

349

raise Exception('VCS type %s is not supported' % self.vcs)

349

raise Exception('VCS type %s is not supported' % self.vcs)

350

351

def _clean_line(self, line, command):

351

def _clean_line(self, line, command):

352

if command in ['+', '-', ' ']:

352

if command in ['+', '-', ' ']:

353

#only modify the line if it's actually a diff thing

353

#only modify the line if it's actually a diff thing

354

line = line[1:]

354

line = line[1:]

355

return line

355

return line

356

357

def _parse_gitdiff(self, inline_diff=True):

357

def _parse_gitdiff(self, inline_diff=True):

358

_files = []

358

_files = []

359

diff_container = lambda arg: arg

359

diff_container = lambda arg: arg

360

361

##split the diff in chunks of separate --git a/file b/file chunks

361

##split the diff in chunks of separate --git a/file b/file chunks

362

for raw_diff in ('\n' + self._diff).split('\ndiff --git')[1:]:

362

for raw_diff in ('\n' + self._diff).split('\ndiff --git')[1:]:

363

binary = False

363

binary = False

364

binary_msg = 'unknown binary'

364

binary_msg = 'unknown binary'

365

head, diff = self._get_header(raw_diff)

365

head, diff = self._get_header(raw_diff)

366

367

if not head['a_file'] and head['b_file']:

367

if not head['a_file'] and head['b_file']:

368

op = 'A'

368

op = 'A'

369

elif head['a_file'] and head['b_file']:

369

elif head['a_file'] and head['b_file']:

370

op = 'M'

370

op = 'M'

371

elif head['a_file'] and not head['b_file']:

371

elif head['a_file'] and not head['b_file']:

372

op = 'D'

372

op = 'D'

373

else:

373

else:

374

#probably we're dealing with a binary file 1

374

#probably we're dealing with a binary file 1

375

binary = True

375

binary = True

376

if head['deleted_file_mode']:

376

if head['deleted_file_mode']:

377

op = 'D'

377

op = 'D'

378

stats = ['b', DEL_FILENODE]

378

stats = ['b', DEL_FILENODE]

379

binary_msg = 'deleted binary file'

379

binary_msg = 'deleted binary file'

380

elif head['new_file_mode']:

380

elif head['new_file_mode']:

381

op = 'A'

381

op = 'A'

382

stats = ['b', NEW_FILENODE]

382

stats = ['b', NEW_FILENODE]

383

binary_msg = 'new binary file %s' % head['new_file_mode']

383

binary_msg = 'new binary file %s' % head['new_file_mode']

384

else:

384

else:

385

if head['new_mode'] and head['old_mode']:

385

if head['new_mode'] and head['old_mode']:

386

stats = ['b', CHMOD_FILENODE]

386

stats = ['b', CHMOD_FILENODE]

387

op = 'M'

387

op = 'M'

388

binary_msg = ('modified binary file chmod %s => %s'

388

binary_msg = ('modified binary file chmod %s => %s'

389

% (head['old_mode'], head['new_mode']))

389

% (head['old_mode'], head['new_mode']))

390

elif (head['rename_from'] and head['rename_to']

390

elif (head['rename_from'] and head['rename_to']

391

and head['rename_from'] != head['rename_to']):

391

and head['rename_from'] != head['rename_to']):

392

stats = ['b', RENAMED_FILENODE]

392

stats = ['b', RENAMED_FILENODE]

393

op = 'M'

393

op = 'M'

394

binary_msg = ('file renamed from %s to %s'

394

binary_msg = ('file renamed from %s to %s'

395

% (head['rename_from'], head['rename_to']))

395

% (head['rename_from'], head['rename_to']))

396

else:

396

else:

397

stats = ['b', MOD_FILENODE]

397

stats = ['b', MOD_FILENODE]

398

op = 'M'

398

op = 'M'

399

binary_msg = 'modified binary file'

399

binary_msg = 'modified binary file'

400

401

if not binary:

401

if not binary:

402

try:

402

try:

403

chunks, stats = self._parse_lines(diff)

403

chunks, stats = self._parse_lines(diff)

404

except DiffLimitExceeded:

404

except DiffLimitExceeded:

405

diff_container = lambda _diff: LimitedDiffContainer(

405

diff_container = lambda _diff: LimitedDiffContainer(

406

self.diff_limit,

406

self.diff_limit,

407

self.cur_diff_size,

407

self.cur_diff_size,

408

_diff)

408

_diff)

409

break

409

break

410

else:

410

else:

411

chunks = []

411

chunks = []

412

chunks.append([{

412

chunks.append([{

413

'old_lineno': '',

413

'old_lineno': '',

414

'new_lineno': '',

414

'new_lineno': '',

415

'action': 'binary',

415

'action': 'binary',

416

'line': binary_msg,

416

'line': binary_msg,

417

}])

417

}])

418

419

_files.append({

419

_files.append({

420

'filename': head['b_path'],

420

'filename': head['b_path'],

421

'old_revision': head['a_blob_id'],

421

'old_revision': head['a_blob_id'],

422

'new_revision': head['b_blob_id'],

422

'new_revision': head['b_blob_id'],

423

'chunks': chunks,

423

'chunks': chunks,

424

'operation': op,

424

'operation': op,

425

'stats': stats,

425

'stats': stats,

426

})

426

})

427

428

sorter = lambda info: {'A': 0, 'M': 1, 'D': 2}.get(info['operation'])

428

sorter = lambda info: {'A': 0, 'M': 1, 'D': 2}.get(info['operation'])

429

430

if inline_diff is False:

430

if inline_diff is False:

431

return diff_container(sorted(_files, key=sorter))

431

return diff_container(sorted(_files, key=sorter))

432

433

# highlight inline changes

433

# highlight inline changes

434

for diff_data in _files:

434

for diff_data in _files:

435

for chunk in diff_data['chunks']:

435

for chunk in diff_data['chunks']:

436

lineiter = iter(chunk)

436

lineiter = iter(chunk)

437

try:

437

try:

438

while 1:

438

while 1:

439

line = lineiter.next()

439

line = lineiter.next()

440

if line['action'] not in ['unmod', 'context']:

440

if line['action'] not in ['unmod', 'context']:

441

nextline = lineiter.next()

441

nextline = lineiter.next()

442

if nextline['action'] in ['unmod', 'context'] or \

442

if nextline['action'] in ['unmod', 'context'] or \

443

nextline['action'] == line['action']:

443

nextline['action'] == line['action']:

444

continue

444

continue

445

self.differ(line, nextline)

445

self.differ(line, nextline)

446

except StopIteration:

446

except StopIteration:

447

pass

447

pass

448

449

return diff_container(sorted(_files, key=sorter))

449

return diff_container(sorted(_files, key=sorter))

450

451

def _parse_udiff(self, inline_diff=True):

451

def _parse_udiff(self, inline_diff=True):

452

raise NotImplementedError()

452

raise NotImplementedError()

453

454

def _parse_lines(self, diff):

454

def _parse_lines(self, diff):

455

"""

455

"""

456

Parse the diff an return data for the template.

456

Parse the diff an return data for the template.

457

"""

457

"""

458

459

lineiter = iter(diff)

459

lineiter = iter(diff)

460

stats = [0, 0]

460

stats = [0, 0]

461

462

try:

462

try:

463

chunks = []

463

chunks = []

464

line = lineiter.next()

464

line = lineiter.next()

465

466

while line:

466

while line:

467

lines = []

467

lines = []

468

chunks.append(lines)

468

chunks.append(lines)

469

470

match = self._chunk_re.match(line)

470

match = self._chunk_re.match(line)

471

472

if not match:

472

if not match:

473

break

473

break

474

475

gr = match.groups()

475

gr = match.groups()

476

(old_line, old_end,

476

(old_line, old_end,

477

new_line, new_end) = [int(x or 1) for x in gr[:-1]]

477

new_line, new_end) = [int(x or 1) for x in gr[:-1]]

478

old_line -= 1

478

old_line -= 1

479

new_line -= 1

479

new_line -= 1

480

481

context = len(gr) == 5

481

context = len(gr) == 5

482

old_end += old_line

482

old_end += old_line

483

new_end += new_line

483

new_end += new_line

484

485

if context:

485

if context:

486

# skip context only if it's first line

486

# skip context only if it's first line

487

if int(gr[0]) > 1:

487

if int(gr[0]) > 1:

488

lines.append({

488

lines.append({

489

'old_lineno': '...',

489

'old_lineno': '...',

490

'new_lineno': '...',

490

'new_lineno': '...',

491

'action': 'context',

491

'action': 'context',

492

'line': line,

492

'line': line,

493

})

493

})

494

495

line = lineiter.next()

495

line = lineiter.next()

496

497

while old_line < old_end or new_line < new_end:

497

while old_line < old_end or new_line < new_end:

498

command = ' '

498

command = ' '

499

if line:

499

if line:

500

command = line[0]

500

command = line[0]

501

502

affects_old = affects_new = False

502

affects_old = affects_new = False

503

504

# ignore those if we don't expect them

504

# ignore those if we don't expect them

505

if command in '#@':

505

if command in '#@':

506

continue

506

continue

507

elif command == '+':

507

elif command == '+':

508

affects_new = True

508

affects_new = True

509

action = 'add'

509

action = 'add'

510

stats[0] += 1

510

stats[0] += 1

511

elif command == '-':

511

elif command == '-':

512

affects_old = True

512

affects_old = True

513

action = 'del'

513

action = 'del'

514

stats[1] += 1

514

stats[1] += 1

515

else:

515

else:

516

affects_old = affects_new = True

516

affects_old = affects_new = True

517

action = 'unmod'

517

action = 'unmod'

518

519

if not self._newline_marker.match(line):

519

if not self._newline_marker.match(line):

520

old_line += affects_old

520

old_line += affects_old

521

new_line += affects_new

521

new_line += affects_new

522

lines.append({

522

lines.append({

523

'old_lineno': affects_old and old_line or '',

523

'old_lineno': affects_old and old_line or '',

524

'new_lineno': affects_new and new_line or '',

524

'new_lineno': affects_new and new_line or '',

525

'action': action,

525

'action': action,

526

'line': self._clean_line(line, command)

526

'line': self._clean_line(line, command)

527

})

527

})

528

529

line = lineiter.next()

529

line = lineiter.next()

530

531

if self._newline_marker.match(line):

531

if self._newline_marker.match(line):

532

# we need to append to lines, since this is not

532

# we need to append to lines, since this is not

533

# counted in the line specs of diff

533

# counted in the line specs of diff

534

lines.append({

534

lines.append({

535

'old_lineno': '...',

535

'old_lineno': '...',

536

'new_lineno': '...',

536

'new_lineno': '...',

537

'action': 'context',

537

'action': 'context',

538

'line': self._clean_line(line, command)

538

'line': self._clean_line(line, command)

539

})

539

})

540

541

except StopIteration:

541

except StopIteration:

542

pass

542

pass

543

return chunks, stats

543

return chunks, stats

544

545

def _safe_id(self, idstring):

545

def _safe_id(self, idstring):

546

"""Make a string safe for including in an id attribute.

546

"""Make a string safe for including in an id attribute.

547

548

The HTML spec says that id attributes 'must begin with

548

The HTML spec says that id attributes 'must begin with

549

a letter ([A-Za-z]) and may be followed by any number

549

a letter ([A-Za-z]) and may be followed by any number

550

of letters, digits ([0-9]), hyphens ("-"), underscores

550

of letters, digits ([0-9]), hyphens ("-"), underscores

551

("_"), colons (":"), and periods (".")'. These regexps

551

("_"), colons (":"), and periods (".")'. These regexps

552

are slightly over-zealous, in that they remove colons

552

are slightly over-zealous, in that they remove colons

553

and periods unnecessarily.

553

and periods unnecessarily.

554

555

Whitespace is transformed into underscores, and then

555

Whitespace is transformed into underscores, and then

556

anything which is not a hyphen or a character that

556

anything which is not a hyphen or a character that

557

matches \w (alphanumerics and underscore) is removed.

557

matches \w (alphanumerics and underscore) is removed.

558

559

"""

559

"""

560

# Transform all whitespace to underscore

560

# Transform all whitespace to underscore

561

idstring = re.sub(r'\s', "_", '%s' % idstring)

561

idstring = re.sub(r'\s', "_", '%s' % idstring)

562

# Remove everything that is not a hyphen or a member of \w

562

# Remove everything that is not a hyphen or a member of \w

563

idstring = re.sub(r'(?!-)\W', "", idstring).lower()

563

idstring = re.sub(r'(?!-)\W', "", idstring).lower()

564

return idstring

564

return idstring

565

566

def prepare(self, inline_diff=True):

566

def prepare(self, inline_diff=True):

567

"""

567

"""

568

Prepare the passed udiff for HTML rendering. It'l return a list

568

Prepare the passed udiff for HTML rendering. It'l return a list

569

of dicts with diff information

569

of dicts with diff information

570

"""

570

"""

571

parsed = self._parser(inline_diff=inline_diff)

571

parsed = self._parser(inline_diff=inline_diff)

572

self.parsed = True

572

self.parsed = True

573

self.parsed_diff = parsed

573

self.parsed_diff = parsed

574

return parsed

574

return parsed

575

576

def as_raw(self, diff_lines=None):

576

def as_raw(self, diff_lines=None):

577

"""

577

"""

578

Returns raw string diff

578

Returns raw string diff

579

"""

579

"""

580

return self._diff

580

return self._diff

581

#return u''.join(imap(self._line_counter, self._diff.splitlines(1)))

581

#return u''.join(imap(self._line_counter, self._diff.splitlines(1)))

582

583

def as_html(self, table_class='code-difftable', line_class='line',

583

def as_html(self, table_class='code-difftable', line_class='line',

584

new_lineno_class='lineno old', old_lineno_class='lineno new',

584

new_lineno_class='lineno old', old_lineno_class='lineno new',

585

code_class='code', enable_comments=False, parsed_lines=None):

585

code_class='code', enable_comments=False, parsed_lines=None):

586

"""

586

"""

587

Return given diff as html table with customized css classes

587

Return given diff as html table with customized css classes

588

"""

588

"""

589

def _link_to_if(condition, label, url):

589

def _link_to_if(condition, label, url):

590

"""

590

"""

591

Generates a link if condition is meet or just the label if not.

591

Generates a link if condition is meet or just the label if not.

592

"""

592

"""

593

594

if condition:

594

if condition:

595

return '''<a href="%(url)s">%(label)s</a>''' % {

595

return '''<a href="%(url)s">%(label)s</a>''' % {

596

'url': url,

596

'url': url,

597

'label': label

597

'label': label

598

}

598

}

599

else:

599

else:

600

return label

600

return label

601

if not self.parsed:

601

if not self.parsed:

602

self.prepare()

602

self.prepare()

603

604

diff_lines = self.parsed_diff

604

diff_lines = self.parsed_diff

605

if parsed_lines:

605

if parsed_lines:

606

diff_lines = parsed_lines

606

diff_lines = parsed_lines

607

608

_html_empty = True

608

_html_empty = True

609

_html = []

609

_html = []

610

_html.append('''<table class="%(table_class)s">\n''' % {

610

_html.append('''<table class="%(table_class)s">\n''' % {

611

'table_class': table_class

611

'table_class': table_class

612

})

612

})

613

614

for diff in diff_lines:

614

for diff in diff_lines:

615

for line in diff['chunks']:

615

for line in diff['chunks']:

616

_html_empty = False

616

_html_empty = False

617

for change in line:

617

for change in line:

618

_html.append('''<tr class="%(lc)s %(action)s">\n''' % {

618

_html.append('''<tr class="%(lc)s %(action)s">\n''' % {

619

'lc': line_class,

619

'lc': line_class,

620

'action': change['action']

620

'action': change['action']

621

})

621

})

622

anchor_old_id = ''

622

anchor_old_id = ''

623

anchor_new_id = ''

623

anchor_new_id = ''

624

anchor_old = "%(filename)s_o%(oldline_no)s" % {

624

anchor_old = "%(filename)s_o%(oldline_no)s" % {

625

'filename': self._safe_id(diff['filename']),

625

'filename': self._safe_id(diff['filename']),

626

'oldline_no': change['old_lineno']

626

'oldline_no': change['old_lineno']

627

}

627

}

628

anchor_new = "%(filename)s_n%(oldline_no)s" % {

628

anchor_new = "%(filename)s_n%(oldline_no)s" % {

629

'filename': self._safe_id(diff['filename']),

629

'filename': self._safe_id(diff['filename']),

630

'oldline_no': change['new_lineno']

630

'oldline_no': change['new_lineno']

631

}

631

}

632

cond_old = (change['old_lineno'] != '...' and

632

cond_old = (change['old_lineno'] != '...' and

633

change['old_lineno'])

633

change['old_lineno'])

634

cond_new = (change['new_lineno'] != '...' and

634

cond_new = (change['new_lineno'] != '...' and

635

change['new_lineno'])

635

change['new_lineno'])

636

if cond_old:

636

if cond_old:

637

anchor_old_id = 'id="%s"' % anchor_old

637

anchor_old_id = 'id="%s"' % anchor_old

638

if cond_new:

638

if cond_new:

639

anchor_new_id = 'id="%s"' % anchor_new

639

anchor_new_id = 'id="%s"' % anchor_new

640

###########################################################

640

###########################################################

641

# OLD LINE NUMBER

641

# OLD LINE NUMBER

642

###########################################################

642

###########################################################

643

_html.append('''\t<td %(a_id)s class="%(olc)s">''' % {

643

_html.append('''\t<td %(a_id)s class="%(olc)s">''' % {

644

'a_id': anchor_old_id,

644

'a_id': anchor_old_id,

645

'olc': old_lineno_class

645

'olc': old_lineno_class

646

})

646

})

647

648

_html.append('''%(link)s''' % {

648

_html.append('''%(link)s''' % {

649

'link': _link_to_if(True, change['old_lineno'],

649

'link': _link_to_if(True, change['old_lineno'],

650

'#%s' % anchor_old)

650

'#%s' % anchor_old)

651

})

651

})

652

_html.append('''</td>\n''')

652

_html.append('''</td>\n''')

653

###########################################################

653

###########################################################

654

# NEW LINE NUMBER

654

# NEW LINE NUMBER

655

###########################################################

655

###########################################################

656

657

_html.append('''\t<td %(a_id)s class="%(nlc)s">''' % {

657

_html.append('''\t<td %(a_id)s class="%(nlc)s">''' % {

658

'a_id': anchor_new_id,

658

'a_id': anchor_new_id,

659

'nlc': new_lineno_class

659

'nlc': new_lineno_class

660

})

660

})

661

662

_html.append('''%(link)s''' % {

662

_html.append('''%(link)s''' % {

663

'link': _link_to_if(True, change['new_lineno'],

663

'link': _link_to_if(True, change['new_lineno'],

664

'#%s' % anchor_new)

664

'#%s' % anchor_new)

665

})

665

})

666

_html.append('''</td>\n''')

666

_html.append('''</td>\n''')

667

###########################################################

667

###########################################################

668

# CODE

668

# CODE

669

###########################################################

669

###########################################################

670

comments = '' if enable_comments else 'no-comment'

670

comments = '' if enable_comments else 'no-comment'

671

_html.append('''\t<td class="%(cc)s %(inc)s">''' % {

671

_html.append('''\t<td class="%(cc)s %(inc)s">''' % {

672

'cc': code_class,

672

'cc': code_class,

673

'inc': comments

673

'inc': comments

674

})

674

})

675

_html.append('''\n\t\t<pre>%(code)s</pre>\n''' % {

675

_html.append('''\n\t\t<pre>%(code)s</pre>\n''' % {

676

'code': change['line']

676

'code': change['line']

677

})

677

})

678

679

_html.append('''\t</td>''')

679

_html.append('''\t</td>''')

680

_html.append('''\n</tr>\n''')

680

_html.append('''\n</tr>\n''')

681

_html.append('''</table>''')

681

_html.append('''</table>''')

682

if _html_empty:

682

if _html_empty:

683

return None

683

return None

684

return ''.join(_html)

684

return ''.join(_html)

685

686

def stat(self):

686

def stat(self):

687

"""

687

"""

688

Returns tuple of added, and removed lines for this instance

688

Returns tuple of added, and removed lines for this instance

689

"""

689

"""

690

return self.adds, self.removes

690

return self.adds, self.removes

691

692

693

class InMemoryBundleRepo(bundlerepository):

693

class InMemoryBundleRepo(bundlerepository):

694

def __init__(self, ui, path, bundlestream):

694

def __init__(self, ui, path, bundlestream):

695

self._tempparent = None

695

self._tempparent = None

696

localrepo.localrepository.__init__(self, ui, path)

696

localrepo.localrepository.__init__(self, ui, path)

697

self.ui.setconfig('phases', 'publish', False)

697

self.ui.setconfig('phases', 'publish', False)

698

699

self.bundle = bundlestream

699

self.bundle = bundlestream

700

701

# dict with the mapping 'filename' -> position in the bundle

701

# dict with the mapping 'filename' -> position in the bundle

702

self.bundlefilespos = {}

702

self.bundlefilespos = {}

703

704

705

def differ(org_repo, org_ref, other_repo, other_ref, discovery_data=None,

705

def differ(org_repo, org_ref, other_repo, other_ref, discovery_data=None,

706

remote_compare=False, context=3, ignore_whitespace=False):

706

remote_compare=False, context=3, ignore_whitespace=False):

707

"""

707

"""

708

General differ between branches, bookmarks, revisions of two remote or

708

General differ between branches, bookmarks, revisions of two remote or

709

local but related repositories

709

local but related repositories

710

711

:param org_repo:

711

:param org_repo:

712

:param org_ref:

712

:param org_ref:

713

:param other_repo:

713

:param other_repo:

714

:type other_repo:

714

:type other_repo:

715

:type other_ref:

715

:type other_ref:

716

"""

716

"""

717

718

org_repo_scm = org_repo.scm_instance

718

org_repo_scm = org_repo.scm_instance

719

other_repo_scm = other_repo.scm_instance

719

other_repo_scm = other_repo.scm_instance

720

721

org_repo = org_repo_scm._repo

721

org_repo = org_repo_scm._repo

722

other_repo = other_repo_scm._repo

722

other_repo = other_repo_scm._repo

723

724

org_ref = org_ref[1]

724

org_ref = org_ref[1]

725

other_ref = other_ref[1]

725

other_ref = other_ref[1]

726

727

if org_repo == other_repo:

727

if org_repo_scm == other_repo_scm:

728

log.debug('running diff between %s@%s and %s@%s'

728

log.debug('running diff between %s@%s and %s@%s'

729

% (org_repo.path, org_ref, other_repo.path, other_ref))

729

% (org_repo.path, org_ref, other_repo.path, other_ref))

730

_diff = org_repo_scm.get_diff(rev1=org_ref, rev2=other_ref,

730

_diff = org_repo_scm.get_diff(rev1=org_ref, rev2=other_ref,

731

ignore_whitespace=ignore_whitespace, context=context)

731

ignore_whitespace=ignore_whitespace, context=context)

732

return _diff

732

return _diff

733

734

elif remote_compare:

734

elif remote_compare:

735

opts = diffopts(git=True, ignorews=ignore_whitespace, context=context)

735

opts = diffopts(git=True, ignorews=ignore_whitespace, context=context)

736

common, incoming, rheads = discovery_data

736

common, incoming, rheads = discovery_data

737

org_repo_peer = localrepo.locallegacypeer(org_repo.local())

737

org_repo_peer = localrepo.locallegacypeer(org_repo.local())

738

# create a bundle (uncompressed if other repo is not local)

738

# create a bundle (uncompressed if other repo is not local)

739

if org_repo_peer.capable('getbundle'):

739

if org_repo_peer.capable('getbundle'):

740

# disable repo hooks here since it's just bundle !

740

# disable repo hooks here since it's just bundle !

741

# patch and reset hooks section of UI config to not run any

741

# patch and reset hooks section of UI config to not run any

742

# hooks on fetching archives with subrepos

742

# hooks on fetching archives with subrepos

743

for k, _ in org_repo.ui.configitems('hooks'):

743

for k, _ in org_repo.ui.configitems('hooks'):

744

org_repo.ui.setconfig('hooks', k, None)

744

org_repo.ui.setconfig('hooks', k, None)

745

unbundle = org_repo.getbundle('incoming', common=None,

745

unbundle = org_repo.getbundle('incoming', common=None,

746

heads=None)

746

heads=None)

747

748

buf = BytesIO()

748

buf = BytesIO()

749

while True:

749

while True:

750

chunk = unbundle._stream.read(1024 * 4)

750

chunk = unbundle._stream.read(1024 * 4)

751

if not chunk:

751

if not chunk:

752

break

752

break

753

buf.write(chunk)

753

buf.write(chunk)

754

755

buf.seek(0)

755

buf.seek(0)

756

# replace chunked _stream with data that can do tell() and seek()

756

# replace chunked _stream with data that can do tell() and seek()

757

unbundle._stream = buf

757

unbundle._stream = buf

758

759

ui = make_ui('db')

759

ui = make_ui('db')

760

bundlerepo = InMemoryBundleRepo(ui, path=org_repo.root,

760

bundlerepo = InMemoryBundleRepo(ui, path=org_repo.root,

761

bundlestream=unbundle)

761

bundlestream=unbundle)

762

763

return ''.join(patch.diff(bundlerepo,

763

return ''.join(patch.diff(bundlerepo,

764

node1=other_repo[other_ref].node(),

764

node1=other_repo[other_ref].node(),

765

node2=org_repo[org_ref].node(),

765

node2=org_repo[org_ref].node(),

766

opts=opts))

766

opts=opts))

767

768

return ''

768

return ''

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # -*- coding: utf-8 -*-
             """
                 rhodecode.lib.diffs
                 ~~~~~~~~~~~~~~~~~~~
                 Set of diffing helpers, previously part of vcs
                 :created_on: Dec 4, 2011
                 :author: marcink
                 :copyright: (C) 2010-2012 Marcin Kuzminski <marcin@python-works.com>
                 :original copyright: 2007-2008 by Armin Ronacher
                 :license: GPLv3, see COPYING for more details.
             """
             # This program is free software: you can redistribute it and/or modify
             # it under the terms of the GNU General Public License as published by
             # the Free Software Foundation, either version 3 of the License, or
             # (at your option) any later version.
             #
             # This program is distributed in the hope that it will be useful,
             # but WITHOUT ANY WARRANTY; without even the implied warranty of
             # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
             # GNU General Public License for more details.
             #
             # You should have received a copy of the GNU General Public License
             # along with this program.  If not, see <http://www.gnu.org/licenses/>.
             import re
             import difflib
             import logging
             import traceback
             from itertools import tee, imap
             from mercurial import patch
             from mercurial.mdiff import diffopts
             from mercurial.bundlerepo import bundlerepository
             from pylons.i18n.translation import _
             from rhodecode.lib.compat import BytesIO
             from rhodecode.lib.vcs.utils.hgcompat import localrepo
             from rhodecode.lib.vcs.exceptions import VCSError
             from rhodecode.lib.vcs.nodes import FileNode, SubModuleNode
             from rhodecode.lib.vcs.backends.base import EmptyChangeset
             from rhodecode.lib.helpers import escape
             from rhodecode.lib.utils import make_ui
             from rhodecode.lib.utils2 import safe_unicode
             log = logging.getLogger(__name__)
             def wrap_to_table(str_):
                 """
                 Wrap ``str_`` in a single-row ``code-difftable`` HTML table.

                 :param str_: text placed inside the ``<pre>`` element; it is
                     interpolated as-is, so any escaping is up to the caller
                 """
                 table_template = '''<table class="code-difftable">
                             <tr class="line no-comment">
                             <td class="lineno new"></td>
                             <td class="code no-comment"><pre>%s</pre></td>
                             </tr>
                           </table>'''
                 return table_template % str_
             def wrapped_diff(filenode_old, filenode_new, cut_off_limit=None,
                              ignore_whitespace=True, line_context=3,
                              enable_comments=False):
                 """
                 Render the diff between two file nodes as an HTML table.

                 Binary files, files over ``cut_off_limit`` and empty diffs are
                 replaced with a short message wrapped in the same table markup.

                 :param filenode_old: old file node; ``None`` is replaced with an empty
                     ``FileNode`` at the path of ``filenode_new``
                 :param filenode_new: new file node
                 :param cut_off_limit: size both nodes must stay below to be diffed;
                     ``None`` disables the check, ``-1`` always cuts the diff off
                 :param ignore_whitespace: passed on to ``get_gitdiff``
                 :param line_context: context line count passed on to ``get_gitdiff``
                 :param enable_comments: passed on to ``DiffProcessor.as_html``
                 :returns: tuple ``(size, cs1, cs2, diff, stats)``
                 """
                 if filenode_old is None:
                     filenode_old = FileNode(filenode_new.path, '', EmptyChangeset())

                 # values used by every branch that only shows a message
                 stats = (0, 0)
                 size = 0

                 if filenode_old.is_binary or filenode_new.is_binary:
                     diff = wrap_to_table(_('binary file'))
                 else:
                     within_limit = cut_off_limit != -1 and (
                         cut_off_limit is None or
                         (filenode_old.size < cut_off_limit and
                          filenode_new.size < cut_off_limit))
                     if within_limit:
                         raw_diff = get_gitdiff(filenode_old, filenode_new,
                                                ignore_whitespace=ignore_whitespace,
                                                context=line_context)
                         processor = DiffProcessor(raw_diff, format='gitdiff')
                         diff = processor.as_html(enable_comments=enable_comments)
                         stats = processor.stat()
                         size = len(diff or '')
                     else:
                         diff = wrap_to_table(_('Changeset was too big and was cut off, use '
                                                'diff menu to display this diff'))

                 if not diff:
                     # as_html() produced nothing: either a submodule or no changes
                     submodules = [node for node in (filenode_new, filenode_old)
                                   if isinstance(node, SubModuleNode)]
                     if submodules:
                         message = escape('Submodule %r' % submodules[0])
                     else:
                         message = _('No changes detected')
                     diff = wrap_to_table(message)

                 return (size, filenode_old.changeset.raw_id,
                         filenode_new.changeset.raw_id, diff, stats)
             def get_gitdiff(filenode_old, filenode_new, ignore_whitespace=True, context=3):
                 """
                 Return the git style diff between ``filenode_old`` and ``filenode_new``.

                 An empty string is returned when either node is a ``SubModuleNode``.

                 :param filenode_old: old file node
                 :param filenode_new: new file node; its changeset's repository
                     produces the diff
                 :param ignore_whitespace: ignore whitespaces in diff
                 :param context: number of context lines; a falsy value means 3
                 :raises VCSError: when a node is not a ``FileNode``
                 """
                 # make sure we pass in default context
                 if not context:
                     context = 3

                 if any(isinstance(node, SubModuleNode)
                        for node in (filenode_new, filenode_old)):
                     return ''

                 for node in (filenode_old, filenode_new):
                     if isinstance(node, FileNode):
                         continue
                     raise VCSError("Given object should be FileNode object, not %s"
                                    % node.__class__)

                 repo = filenode_new.changeset.repository
                 # changesets without a raw_id fall back to the repo's empty changeset
                 rev_from = getattr(filenode_old.changeset, 'raw_id', repo.EMPTY_CHANGESET)
                 rev_to = getattr(filenode_new.changeset, 'raw_id', repo.EMPTY_CHANGESET)
                 return repo.get_diff(rev_from, rev_to, filenode_new.path,
                                      ignore_whitespace, context)
             # Operation codes stored as the second element of the ``stats`` list that
             # DiffProcessor._parse_gitdiff builds for binary files,
             # e.g. ``['b', DEL_FILENODE]``.
             NEW_FILENODE = 1
             DEL_FILENODE = 2
             MOD_FILENODE = 3
             RENAMED_FILENODE = 4
             CHMOD_FILENODE = 5
             class DiffLimitExceeded(Exception):
                 """Raised when the processed diff grows beyond the configured limit."""
             class LimitedDiffContainer(object):
                 """
                 Iterable holder for a diff together with its size limit data.
                 """

                 def __init__(self, diff_limit, cur_diff_size, diff):
                     """
                     :param diff_limit: the limit value to keep with the diff
                     :param cur_diff_size: the diff size value to keep with the diff
                     :param diff: iterable that ``__iter__`` walks over
                     """
                     self.diff_limit = diff_limit
                     self.cur_diff_size = cur_diff_size
                     self.diff = diff

                 def __iter__(self):
                     """Yield the items of the wrapped diff one by one."""
                     for entry in self.diff:
                         yield entry
             class DiffProcessor(object):
                 """
                 Give it a unified or git diff and it returns a list of the files that were
                 mentioned in the diff together with a dict of meta information that
                 can be used to render it in a HTML template.
                 """
                 _chunk_re = re.compile(r'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')
                 _newline_marker = re.compile(r'^\\ No newline at end of file')
                 _git_header_re = re.compile(r"""
                     #^diff[ ]--git
                         [ ]a/(?P<a_path>.+?)[ ]b/(?P<b_path>.+?)\n
                     (?:^similarity[ ]index[ ](?P<similarity_index>\d+)%\n
                        ^rename[ ]from[ ](?P<rename_from>\S+)\n
                        ^rename[ ]to[ ](?P<rename_to>\S+)(?:\n|$))?
                     (?:^old[ ]mode[ ](?P<old_mode>\d+)\n
                        ^new[ ]mode[ ](?P<new_mode>\d+)(?:\n|$))?
                     (?:^new[ ]file[ ]mode[ ](?P<new_file_mode>.+)(?:\n|$))?
                     (?:^deleted[ ]file[ ]mode[ ](?P<deleted_file_mode>.+)(?:\n|$))?
                     (?:^index[ ](?P<a_blob_id>[0-9A-Fa-f]+)
                         \.\.(?P<b_blob_id>[0-9A-Fa-f]+)[ ]?(?P<b_mode>.+)?(?:\n|$))?
                     (?:^---[ ](a/(?P<a_file>.+)|/dev/null)(?:\n|$))?
                     (?:^\+\+\+[ ](b/(?P<b_file>.+)|/dev/null)(?:\n|$))?
                 """, re.VERBOSE | re.MULTILINE)
                 _hg_header_re = re.compile(r"""
                     #^diff[ ]--git
                         [ ]a/(?P<a_path>.+?)[ ]b/(?P<b_path>.+?)\n
                     (?:^similarity[ ]index[ ](?P<similarity_index>\d+)%(?:\n|$))?
                     (?:^rename[ ]from[ ](?P<rename_from>\S+)\n
                        ^rename[ ]to[ ](?P<rename_to>\S+)(?:\n|$))?
                     (?:^old[ ]mode[ ](?P<old_mode>\d+)\n
                        ^new[ ]mode[ ](?P<new_mode>\d+)(?:\n|$))?
                     (?:^new[ ]file[ ]mode[ ](?P<new_file_mode>.+)(?:\n|$))?
                     (?:^deleted[ ]file[ ]mode[ ](?P<deleted_file_mode>.+)(?:\n|$))?
                     (?:^index[ ](?P<a_blob_id>[0-9A-Fa-f]+)
                         \.\.(?P<b_blob_id>[0-9A-Fa-f]+)[ ]?(?P<b_mode>.+)?(?:\n|$))?
                     (?:^---[ ](a/(?P<a_file>.+)|/dev/null)(?:\n|$))?
                     (?:^\+\+\+[ ](b/(?P<b_file>.+)|/dev/null)(?:\n|$))?
                 """, re.VERBOSE | re.MULTILINE)
                 def __init__(self, diff, vcs='hg', format='gitdiff', diff_limit=None):
                     """
                     Store the raw diff and pick the parser/highlighter pair.

                     :param diff: a text in diff format
                     :param vcs: type of version control, hg or git
                     :param format: format of diff passed, `udiff` or `gitdiff`
                     :param diff_limit: define the size of diff that is considered
                         "big"; based on that parameter cut off will be triggered,
                         set to None to show full diff
                     :raises Exception: when ``diff`` is not a ``basestring``
                     """
                     if not isinstance(diff, basestring):
                         raise Exception('Diff must be a basestring got %s instead' % type(diff))

                     # input and configuration
                     self._diff = diff
                     self._format = format
                     self.vcs = vcs
                     self.diff_limit = diff_limit

                     # size bookkeeping: total size up front, running size starts at 0
                     self.diff_size = len(diff)
                     self.cur_diff_size = 0

                     # added / removed line counters
                     self.adds = 0
                     self.removes = 0

                     # parse state
                     self.parsed = False
                     self.parsed_diff = []

                     # anything that is not 'gitdiff' is handled as udiff
                     if format != 'gitdiff':
                         self.differ = self._highlight_line_udiff
                         self._parser = self._parse_udiff
                     else:
                         self.differ = self._highlight_line_difflib
                         self._parser = self._parse_gitdiff
                 def _copy_iterator(self):
                     """
                     make a fresh copy of generator, we should not iterate thru
                     an original as it's needed for repeating operations on
                     this instance of DiffProcessor
                     """
                     self.__udiff, iterator_copy = tee(self.__udiff)
                     return iterator_copy
                 def _escaper(self, string):
                     """
                     Escape the HTML special chars of one diff line and check the
                     diff limit.

                     :param string: a single diff line; its length is added to
                         ``cur_diff_size`` before the limit check
                     :raises DiffLimitExceeded: when ``diff_limit`` is set and the
                         accumulated size is greater than it
                     """
                     self.cur_diff_size += len(string)

                     # this runs on each .next() call of the line iterator, so the
                     # limit is checked line by line while parsing
                     limit = self.diff_limit
                     if limit is not None and self.cur_diff_size > limit:
                         raise DiffLimitExceeded('Diff Limit Exceeded')

                     escaped = safe_unicode(string)
                     # '&' has to go first, otherwise the entities get re-escaped
                     for raw, entity in (('&', '&amp;'), ('<', '&lt;'), ('>', '&gt;')):
                         escaped = escaped.replace(raw, entity)
                     return escaped
                 def _line_counter(self, l):
                     """
                     Bump the add/remove totals of this diff for a single line.

                     Lines starting with ``+++`` or ``---`` are not counted.

                     :param l: one line of the diff
                     :returns: the line passed through ``safe_unicode``
                     """
                     if l.startswith('+'):
                         if not l.startswith('+++'):
                             self.adds += 1
                     elif l.startswith('-'):
                         if not l.startswith('---'):
                             self.removes += 1
                     return safe_unicode(l)
                 def _highlight_line_difflib(self, line, next_):
                     """
                     Highlight inline changes in both lines.
                     """
                     if line['action'] == 'del':
                         old, new = line, next_
                     else:
                         old, new = next_, line
                     oldwords = re.split(r'(\W)', old['line'])
                     newwords = re.split(r'(\W)', new['line'])
                     sequence = difflib.SequenceMatcher(None, oldwords, newwords)
                     oldfragments, newfragments = [], []
                     for tag, i1, i2, j1, j2 in sequence.get_opcodes():
                         oldfrag = ''.join(oldwords[i1:i2])
                         newfrag = ''.join(newwords[j1:j2])
                         if tag != 'equal':
                             if oldfrag:
                                 oldfrag = '<del>%s</del>' % oldfrag
                             if newfrag:
                                 newfrag = '<ins>%s</ins>' % newfrag
                         oldfragments.append(oldfrag)
                         newfragments.append(newfrag)
                     old['line'] = "".join(oldfragments)
                     new['line'] = "".join(newfragments)
                 def _highlight_line_udiff(self, line, next_):
                     """
                     Highlight inline changes in both lines.
                     """
                     start = 0
                     limit = min(len(line['line']), len(next_['line']))
                     while start < limit and line['line'][start] == next_['line'][start]:
                         start += 1
                     end = -1
                     limit -= start
                     while -end <= limit and line['line'][end] == next_['line'][end]:
                         end -= 1
                     end += 1
                     if start or end:
                         def do(l):
                             last = end + len(l['line'])
                             if l['action'] == 'add':
                                 tag = 'ins'
                             else:
                                 tag = 'del'
                             l['line'] = '%s<%s>%s</%s>%s' % (
                                 l['line'][:start],
                                 tag,
                                 l['line'][start:last],
                                 tag,
                                 l['line'][last:]
                             )
                         do(line)
                         do(next_)
                 def _get_header(self, diff_chunk):
                     """
                     Parse the diff header and return its parts plus the leftover diff.

                     The parts are a dict of 14 elements::

                         a_path, b_path, similarity_index, rename_from, rename_to,
                         old_mode, new_mode, new_file_mode, deleted_file_mode,
                         a_blob_id, b_blob_id, b_mode, a_file, b_file

                     :param diff_chunk: text of one file's diff, beginning at the header
                     :returns: tuple of the header dict and an iterator over the
                         remaining lines, each passed through ``_escaper``
                     :raises Exception: when ``self.vcs`` is neither ``git`` nor ``hg``
                     """
                     # the two backends only differ in the header regex they use
                     if self.vcs == 'git':
                         header_re = self._git_header_re
                     elif self.vcs == 'hg':
                         header_re = self._hg_header_re
                     else:
                         raise Exception('VCS type %s is not supported' % self.vcs)

                     match = header_re.match(diff_chunk)
                     leftover = diff_chunk[match.end():]
                     # splitlines(1) keeps the line endings on every line
                     return match.groupdict(), imap(self._escaper, leftover.splitlines(1))
                 def _clean_line(self, line, command):
                     if command in ['+', '-', ' ']:
                         #only modify the line if it's actually a diff thing
                         line = line[1:]
                     return line
                 def _parse_gitdiff(self, inline_diff=True):
                     _files = []
                     diff_container = lambda arg: arg
                     ##split the diff in chunks of separate --git a/file b/file chunks
                     for raw_diff in ('\n' + self._diff).split('\ndiff --git')[1:]:
                         binary = False
                         binary_msg = 'unknown binary'
                         head, diff = self._get_header(raw_diff)
                         if not head['a_file'] and head['b_file']:
                             op = 'A'
                         elif head['a_file'] and head['b_file']:
                             op = 'M'
                         elif head['a_file'] and not head['b_file']:
                             op = 'D'
                         else:
                             #probably we're dealing with a binary file 1
                             binary = True
                             if head['deleted_file_mode']:
                                 op = 'D'
                                 stats = ['b', DEL_FILENODE]
                                 binary_msg = 'deleted binary file'
                             elif head['new_file_mode']:
                                 op = 'A'
                                 stats = ['b', NEW_FILENODE]
                                 binary_msg = 'new binary file %s' % head['new_file_mode']
                             else:
                                 if head['new_mode'] and head['old_mode']:
                                     stats = ['b', CHMOD_FILENODE]
                                     op = 'M'
                                     binary_msg = ('modified binary file chmod %s => %s'
                                                   % (head['old_mode'], head['new_mode']))
                                 elif (head['rename_from'] and head['rename_to']
                                       and head['rename_from'] != head['rename_to']):
                                     stats = ['b', RENAMED_FILENODE]
                                     op = 'M'
                                     binary_msg = ('file renamed from %s to %s'
                                                   % (head['rename_from'], head['rename_to']))
                                 else:
                                     stats = ['b', MOD_FILENODE]
                                     op = 'M'
                                     binary_msg = 'modified binary file'
                         if not binary:
                             try:
                                 chunks, stats = self._parse_lines(diff)
                             except DiffLimitExceeded:
                                 diff_container = lambda _diff: LimitedDiffContainer(
                                                             self.diff_limit,
                                                             self.cur_diff_size,
                                                             _diff)
                                 break
                         else:
                             chunks = []
                             chunks.append([{
                                 'old_lineno': '',
                                 'new_lineno': '',
                                 'action':     'binary',
                                 'line':       binary_msg,
                             }])
                         _files.append({
                             'filename':         head['b_path'],
                             'old_revision':     head['a_blob_id'],
                             'new_revision':     head['b_blob_id'],
                             'chunks':           chunks,
                             'operation':        op,
                             'stats':            stats,
                         })
                     sorter = lambda info: {'A': 0, 'M': 1, 'D': 2}.get(info['operation'])
                     if inline_diff is False:
                         return diff_container(sorted(_files, key=sorter))
                     # highlight inline changes
                     for diff_data in _files:
                         for chunk in diff_data['chunks']:
                             lineiter = iter(chunk)
                             try:
                                 while 1:
                                     line = lineiter.next()
                                     if line['action'] not in ['unmod', 'context']:
                                         nextline = lineiter.next()
                                         if nextline['action'] in ['unmod', 'context'] or \
                                            nextline['action'] == line['action']:
                                             continue
                                         self.differ(line, nextline)
                             except StopIteration:
                                 pass
                     return diff_container(sorted(_files, key=sorter))
                 def _parse_udiff(self, inline_diff=True):
                     raise NotImplementedError()
                 def _parse_lines(self, diff):
                     """
                     Parse the diff an return data for the template.
                     """
                     lineiter = iter(diff)
                     stats = [0, 0]
                     try:
                         chunks = []
                         line = lineiter.next()
                         while line:
                             lines = []
                             chunks.append(lines)
                             match = self._chunk_re.match(line)
                             if not match:
                                 break
                             gr = match.groups()
                             (old_line, old_end,
                              new_line, new_end) = [int(x or 1) for x in gr[:-1]]
                             old_line -= 1
                             new_line -= 1
                             context = len(gr) == 5
                             old_end += old_line
                             new_end += new_line
                             if context:
                                 # skip context only if it's first line
                                 if int(gr[0]) > 1:
                                     lines.append({
                                         'old_lineno': '...',
                                         'new_lineno': '...',
                                         'action':     'context',
                                         'line':       line,
                                     })
                             line = lineiter.next()
                             while old_line < old_end or new_line < new_end:
                                 command = ' '
                                 if line:
                                     command = line[0]
                                 affects_old = affects_new = False
                                 # ignore those if we don't expect them
                                 if command in '#@':
                                     continue
                                 elif command == '+':
                                     affects_new = True
                                     action = 'add'
                                     stats[0] += 1
                                 elif command == '-':
                                     affects_old = True
                                     action = 'del'
                                     stats[1] += 1
                                 else:
                                     affects_old = affects_new = True
                                     action = 'unmod'
                                 if not self._newline_marker.match(line):
                                     old_line += affects_old
                                     new_line += affects_new
                                     lines.append({
                                         'old_lineno':   affects_old and old_line or '',
                                         'new_lineno':   affects_new and new_line or '',
                                         'action':       action,
                                         'line':         self._clean_line(line, command)
                                     })
                                 line = lineiter.next()
                                 if self._newline_marker.match(line):
                                     # we need to append to lines, since this is not
                                     # counted in the line specs of diff
                                     lines.append({
                                         'old_lineno':   '...',
                                         'new_lineno':   '...',
                                         'action':       'context',
                                         'line':         self._clean_line(line, command)
                                     })
                     except StopIteration:
                         pass
                     return chunks, stats
                 def _safe_id(self, idstring):
                     """Make a string safe for including in an id attribute.
                     The HTML spec says that id attributes 'must begin with
                     a letter ([A-Za-z]) and may be followed by any number
                     of letters, digits ([0-9]), hyphens ("-"), underscores
                     ("_"), colons (":"), and periods (".")'. These regexps
                     are slightly over-zealous, in that they remove colons
                     and periods unnecessarily.
                     Whitespace is transformed into underscores, and then
                     anything which is not a hyphen or a character that
                     matches \w (alphanumerics and underscore) is removed.
                     """
                     # Transform all whitespace to underscore
                     idstring = re.sub(r'\s', "_", '%s' % idstring)
                     # Remove everything that is not a hyphen or a member of \w
                     idstring = re.sub(r'(?!-)\W', "", idstring).lower()
                     return idstring
                 def prepare(self, inline_diff=True):
                     """
                     Run the configured parser and cache its result on the instance.

                     The parsed data is meant for HTML rendering. After the call
                     ``self.parsed`` is ``True`` and ``self.parsed_diff`` holds the
                     value that is returned.

                     :param inline_diff: forwarded to ``self._parser``
                     :returns: whatever ``self._parser`` produced
                     """
                     result = self._parser(inline_diff=inline_diff)
                     self.parsed, self.parsed_diff = True, result
                     return result
                 def as_raw(self, diff_lines=None):
                     """
                     Return the diff exactly as stored on this instance.

                     :param diff_lines: accepted but not used
                     :returns: ``self._diff`` unchanged
                     """
                     raw_diff = self._diff
                     return raw_diff
                 def as_html(self, table_class='code-difftable', line_class='line',
                             new_lineno_class='lineno old', old_lineno_class='lineno new',
                             code_class='code', enable_comments=False, parsed_lines=None):
                     """
                     Render the diff as an HTML table using the given css classes.

                     The diff is parsed first through ``self.prepare()`` when that has
                     not happened yet. Every diff line becomes one table row with an
                     old-line-number cell, a new-line-number cell and a code cell.

                     :param table_class: css class of the ``<table>``
                     :param line_class: css class put on every row, next to the
                         line's action
                     :param new_lineno_class: css class of the new-line-number cell
                     :param old_lineno_class: css class of the old-line-number cell
                     :param code_class: css class of the code cell
                     :param enable_comments: when false the code cell is also given
                         the ``no-comment`` class
                     :param parsed_lines: parsed diff data to render instead of the
                         data cached on the instance
                     :returns: the html string, or ``None`` when there is no chunk
                         to render
                     """
                     def _lineno_cell(css_class, lineno, anchor):
                         # Only real line numbers get an id; '...' markers and
                         # empty values do not. The number itself is always
                         # rendered as a link to the anchor.
                         id_attr = ''
                         if lineno != '...' and lineno:
                             id_attr = 'id="%s"' % anchor
                         return ''.join([
                             '''\t<td %(a_id)s class="%(cls)s">''' % {
                                 'a_id': id_attr,
                                 'cls': css_class
                             },
                             '''<a href="%(url)s">%(label)s</a>''' % {
                                 'url': '#%s' % anchor,
                                 'label': lineno
                             },
                             '''</td>\n''',
                         ])

                     if not self.parsed:
                         self.prepare()
                     cached = self.parsed_diff
                     diff_lines = parsed_lines if parsed_lines else cached
                     comment_class = '' if enable_comments else 'no-comment'

                     saw_chunk = False
                     parts = ['''<table class="%(table_class)s">\n''' % {
                         'table_class': table_class
                     }]
                     for file_diff in diff_lines:
                         for chunk in file_diff['chunks']:
                             saw_chunk = True
                             for change in chunk:
                                 parts.append('''<tr class="%(lc)s %(action)s">\n''' % {
                                     'lc': line_class,
                                     'action': change['action']
                                 })
                                 file_id = self._safe_id(file_diff['filename'])
                                 old_no = change['old_lineno']
                                 new_no = change['new_lineno']
                                 # old line number, then new line number
                                 parts.append(_lineno_cell(
                                     old_lineno_class, old_no,
                                     '%s_o%s' % (file_id, old_no)))
                                 parts.append(_lineno_cell(
                                     new_lineno_class, new_no,
                                     '%s_n%s' % (file_id, new_no)))
                                 # code
                                 parts.append('''\t<td class="%(cc)s %(inc)s">''' % {
                                     'cc': code_class,
                                     'inc': comment_class
                                 })
                                 parts.append('''\n\t\t<pre>%(code)s</pre>\n''' % {
                                     'code': change['line']
                                 })
                                 parts.append('''\t</td>''')
                                 parts.append('''\n</tr>\n''')
                     parts.append('''</table>''')

                     if not saw_chunk:
                         return None
                     return ''.join(parts)
                 def stat(self):
                     """
                     Return the added and removed line counters of this instance.

                     :returns: tuple ``(self.adds, self.removes)``
                     """
                     added, removed = self.adds, self.removes
                     return added, removed
             class InMemoryBundleRepo(bundlerepository):
                 """
                 ``bundlerepository`` variant that is handed an already opened
                 bundle object instead of reading one itself.
                 """
                 def __init__(self, ui, path, bundlestream):
                     """
                     :param ui: ui object passed on to the local repository setup
                     :param path: repository path passed on to the local repository
                         setup
                     :param bundlestream: bundle object stored as ``self.bundle``
                     """
                     # NOTE(review): presumably read by cleanup code inherited from
                     # bundlerepository - confirm against the Mercurial version used
                     self._tempparent = None
                     # initialise through localrepository directly; the constructor
                     # of bundlerepository itself is deliberately not called
                     localrepo.localrepository.__init__(self, ui, path)
                     self.ui.setconfig('phases', 'publish', False)
                     self.bundle = bundlestream
                     # dict with the mapping 'filename' -> position in the bundle
                     self.bundlefilespos = {}
             def differ(org_repo, org_ref, other_repo, other_ref, discovery_data=None,
                        remote_compare=False, context=3, ignore_whitespace=False):
                 """
                 General differ between branches, bookmarks, revisions of two remote or
                 local but related repositories

                 :param org_repo: object whose ``scm_instance`` is the origin
                     repository
                 :param org_ref: sequence whose second item is the origin revision
                 :param other_repo: object whose ``scm_instance`` is the other
                     repository
                 :param other_ref: sequence whose second item is the other revision
                 :param discovery_data: 3-item sequence, required when
                     ``remote_compare`` is set
                 :param remote_compare: diff through an in-memory bundle when the two
                     repositories are not the same
                 :param context: number of context lines for the diff
                 :param ignore_whitespace: ignore whitespace changes in the diff
                 :returns: the diff; an empty string when the repositories differ and
                     no remote compare was requested or the origin repository cannot
                     produce a bundle
                 """
                 org_repo_scm = org_repo.scm_instance
                 other_repo_scm = other_repo.scm_instance

                 org_repo = org_repo_scm._repo
                 other_repo = other_repo_scm._repo

                 org_ref = org_ref[1]
                 other_ref = other_ref[1]

                 # compare the scm instances, not the raw backend repository objects
                 if org_repo_scm == other_repo_scm:
                     log.debug('running diff between %s@%s and %s@%s'
                               % (org_repo.path, org_ref, other_repo.path, other_ref))
                     _diff = org_repo_scm.get_diff(rev1=org_ref, rev2=other_ref,
                         ignore_whitespace=ignore_whitespace, context=context)
                     return _diff

                 elif remote_compare:
                     opts = diffopts(git=True, ignorews=ignore_whitespace, context=context)
                     # the unpacked values are not used below, but unpacking still
                     # requires discovery_data to be a 3-item sequence
                     common, incoming, rheads = discovery_data
                     org_repo_peer = localrepo.locallegacypeer(org_repo.local())
                     # create a bundle (uncompressed if other repo is not local)
                     if org_repo_peer.capable('getbundle'):
                         # disable repo hooks here since it's just bundle !
                         # patch and reset hooks section of UI config to not run any
                         # hooks on fetching archives with subrepos
                         for k, _ in org_repo.ui.configitems('hooks'):
                             org_repo.ui.setconfig('hooks', k, None)

                         unbundle = org_repo.getbundle('incoming', common=None,
                                                       heads=None)

                         # read the whole bundle stream into memory
                         buf = BytesIO()
                         while True:
                             chunk = unbundle._stream.read(1024 * 4)
                             if not chunk:
                                 break
                             buf.write(chunk)

                         buf.seek(0)
                         # replace chunked _stream with data that can do tell() and seek()
                         unbundle._stream = buf

                         ui = make_ui('db')
                         bundlerepo = InMemoryBundleRepo(ui, path=org_repo.root,
                                                         bundlestream=unbundle)

                         return ''.join(patch.diff(bundlerepo,
                                                   node1=other_repo[other_ref].node(),
                                                   node2=org_repo[org_ref].node(),
                                                   opts=opts))

                 return ''