##// END OF EJS Templates
issue1578: fix crash: do not use synthetic changesets as merge parents.
Greg Ward -
r7950:9bbcfa89 default
parent child Browse files
Show More
@@ -1,740 +1,741
1 #
1 #
2 # Mercurial built-in replacement for cvsps.
2 # Mercurial built-in replacement for cvsps.
3 #
3 #
4 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
4 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
5 #
5 #
6 # This software may be used and distributed according to the terms
6 # This software may be used and distributed according to the terms
7 # of the GNU General Public License, incorporated herein by reference.
7 # of the GNU General Public License, incorporated herein by reference.
8
8
9 import os
9 import os
10 import re
10 import re
11 import cPickle as pickle
11 import cPickle as pickle
12 from mercurial import util
12 from mercurial import util
13 from mercurial.i18n import _
13 from mercurial.i18n import _
14
14
def listsort(list, key):
    """Sort *list* in place by *key*, with a Python 2.3 fallback.

    list.sort() only grew its key= argument in Python 2.4; on older
    interpreters the keyword raises TypeError, so we emulate it with a
    comparison function instead.
    """
    try:
        list.sort(key=key)
    except TypeError:
        # Pre-2.4: emulate key= by comparing the extracted keys.
        list.sort(lambda a, b: cmp(key(a), key(b)))
class logentry(object):
    '''A single CVS file revision, as parsed from "cvs rlog" output.

    Instances are plain attribute bags; every keyword passed to the
    constructor becomes an attribute.  The attributes used are:
    .author    - author name as CVS knows it
    .branch    - name of branch this revision is on
    .branches  - revision tuple of branches starting at this revision
    .comment   - commit message
    .date      - the commit date as a (time, tz) tuple
    .dead      - true if file revision is dead
    .file      - name of file
    .lines     - a tuple (+lines, -lines) or None
    .parent    - previous revision of this entry
    .rcs       - name of file as returned from CVS
    .revision  - revision number as tuple
    .tags      - list of tags on the file
    .synthetic - is this a synthetic "file ... added on ..." revision?
    '''
    def __init__(self, **entries):
        # Every keyword argument becomes an instance attribute.
        for name, value in entries.items():
            setattr(self, name, value)
class logerror(Exception):
    '''Raised when the CVS log cannot be collected (e.g. the current
    directory is not a CVS sandbox, or the log cache overlaps newly
    fetched entries).'''
def getrepopath(cvspath):
    """Return the repository path from a CVS path.

    >>> getrepopath('/foo/bar')
    '/foo/bar'
    >>> getrepopath('c:/foo/bar')
    'c:/foo/bar'
    >>> getrepopath(':pserver:10/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:10c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:c:/foo/bar')
    'c:/foo/bar'
    >>> getrepopath(':pserver:truc@foo.bar:/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:truc@foo.bar:c:/foo/bar')
    'c:/foo/bar'
    """
    # Per the CVS manual, CVS paths look like:
    #   [:method:][[user][:password]@]hostname[:[port]]/path/to/repository
    # Windows absolute paths start with a drive letter such as 'c:',
    # which makes colon-splitting ambiguous.  We assume drive letters
    # are exactly one character long and that any CVS component before
    # the repository path is at least two characters long, and use that
    # to disambiguate.
    pieces = cvspath.split(':')
    if len(pieces) == 1:
        # No colons at all: already a bare repository path.
        return pieces[0]
    # Ambiguous case: a port number could sit right in front of a
    # Windows drive letter.  We assume that never happens, so a
    # multi-character next-to-last piece must be a CVS component; the
    # last piece is the repository path, minus any leading port digits.
    if len(pieces[-2]) > 1:
        return pieces[-1].lstrip('0123456789')
    # Single-character next-to-last piece: a drive letter that the
    # split separated from its path — glue it back on.
    return '%s:%s' % (pieces[-2], pieces[-1])
def createlog(ui, directory=None, root="", rlog=True, cache=None):
    '''Collect the CVS rlog

    Runs "cvs rlog" (or "cvs log" when rlog is False) and parses its
    output with a line-by-line state machine, producing a list of
    logentry objects, one per file revision.

    ui        - Mercurial ui object, used for status/note/debug output
    directory - directory to log; None means "use the CVS sandbox in
                the current working directory"
    root      - CVSROOT to use; when empty, falls back to the sandbox
                CVS/Root file and then the CVSROOT environment variable
    rlog      - run "cvs rlog" instead of "cvs log"
    cache     - if set, keep a pickled cache of log entries under
                ~/.hg.cvsps; the value 'update' also loads the existing
                cache and asks CVS only for entries newer than it

    Returns the list of logentry objects.  Raises logerror when the
    current directory is not a CVS sandbox (with directory=None) or
    when the cache overlaps the newly fetched entries.
    '''

    # Because we store many duplicate commit log messages, reusing strings
    # saves a lot of memory and pickle storage space.
    _scache = {}
    def scache(s):
        "return a shared version of a string"
        return _scache.setdefault(s, s)

    ui.status(_('collecting CVS rlog\n'))

    log = []      # list of logentry objects containing the CVS state

    # patterns to match in CVS (r)log output, by state of use
    re_00 = re.compile('RCS file: (.+)$')
    re_01 = re.compile('cvs \\[r?log aborted\\]: (.+)$')
    re_02 = re.compile('cvs (r?log|server): (.+)\n$')
    re_03 = re.compile("(Cannot access.+CVSROOT)|(can't create temporary directory.+)$")
    re_10 = re.compile('Working file: (.+)$')
    re_20 = re.compile('symbolic names:')
    re_30 = re.compile('\t(.+): ([\\d.]+)$')
    re_31 = re.compile('----------------------------$')
    re_32 = re.compile('=============================================================================$')
    re_50 = re.compile('revision ([\\d.]+)(\s+locked by:\s+.+;)?$')
    re_60 = re.compile(r'date:\s+(.+);\s+author:\s+(.+);\s+state:\s+(.+?);(\s+lines:\s+(\+\d+)?\s+(-\d+)?;)?')
    re_70 = re.compile('branches: (.+);$')

    # matches the message CVS puts on synthetic dead revisions created
    # when a file is first added on a branch
    file_added_re = re.compile(r'file [^/]+ was (initially )?added on branch')

    prefix = ''   # leading path to strip of what we get from CVS

    if directory is None:
        # Current working directory

        # Get the real directory in the repository
        try:
            prefix = file(os.path.join('CVS','Repository')).read().strip()
            if prefix == ".":
                prefix = ""
            directory = prefix
        except IOError:
            raise logerror('Not a CVS sandbox')

        if prefix and not prefix.endswith(os.sep):
            prefix += os.sep

        # Use the Root file in the sandbox, if it exists
        try:
            root = file(os.path.join('CVS','Root')).read().strip()
        except IOError:
            pass

    if not root:
        root = os.environ.get('CVSROOT', '')

    # read log cache if one exists
    oldlog = []
    date = None

    if cache:
        cachedir = os.path.expanduser('~/.hg.cvsps')
        if not os.path.exists(cachedir):
            os.mkdir(cachedir)

        # The cvsps cache pickle needs a uniquified name, based on the
        # repository location. The address may have all sort of nasties
        # in it, slashes, colons and such. So here we take just the
        # alphanumerics, concatenated in a way that does not mix up the
        # various components, so that
        #    :pserver:user@server:/path
        # and
        #    /pserver/user/server/path
        # are mapped to different cache file names.
        cachefile = root.split(":") + [directory, "cache"]
        cachefile = ['-'.join(re.findall(r'\w+', s)) for s in cachefile if s]
        cachefile = os.path.join(cachedir,
                                 '.'.join([s for s in cachefile if s]))

        if cache == 'update':
            try:
                ui.note(_('reading cvs log cache %s\n') % cachefile)
                oldlog = pickle.load(file(cachefile))
                ui.note(_('cache has %d log entries\n') % len(oldlog))
            except Exception, e:
                # best effort: a broken/missing cache just means a full rlog
                ui.note(_('error reading cache: %r\n') % e)

            if oldlog:
                date = oldlog[-1].date    # last commit date as a (time,tz) tuple
                date = util.datestr(date, '%Y/%m/%d %H:%M:%S %1%2')

    # build the CVS commandline
    cmd = ['cvs', '-q']
    if root:
        cmd.append('-d%s' % root)
        p = util.normpath(getrepopath(root))
        if not p.endswith('/'):
            p += '/'
        prefix = p + util.normpath(prefix)
    cmd.append(['log', 'rlog'][rlog])
    if date:
        # no space between option and date string
        cmd.append('-d>%s' % date)
    cmd.append(directory)

    # state machine begins here
    # states: 0 = seek 'RCS file', 1 = expect 'Working file',
    # 2 = seek 'symbolic names', 3 = read tags, 4 = expect first '----'
    # separator, 5 = expect revision number, 6 = expect date/author
    # line, 7 = read branches or log message, 8 = read log message
    tags = {}     # dictionary of revisions on current file with their tags
    state = 0
    store = False # set when a new record can be appended

    cmd = [util.shellquote(arg) for arg in cmd]
    ui.note(_("running %s\n") % (' '.join(cmd)))
    ui.debug(_("prefix=%r directory=%r root=%r\n") % (prefix, directory, root))

    pfp = util.popen(' '.join(cmd))
    peek = pfp.readline()   # one-line lookahead, used by state 7
    while True:
        line = peek
        if line == '':
            break
        peek = pfp.readline()
        if line.endswith('\n'):
            line = line[:-1]
        #ui.debug('state=%d line=%r\n' % (state, line))

        if state == 0:
            # initial state, consume input until we see 'RCS file'
            match = re_00.match(line)
            if match:
                rcs = match.group(1)
                tags = {}
                if rlog:
                    # drop the ',v' suffix of the RCS file name
                    filename = util.normpath(rcs[:-2])
                    if filename.startswith(prefix):
                        filename = filename[len(prefix):]
                    if filename.startswith('/'):
                        filename = filename[1:]
                    # removed files live in the Attic subdirectory
                    if filename.startswith('Attic/'):
                        filename = filename[6:]
                    else:
                        filename = filename.replace('/Attic/', '/')
                    state = 2
                    continue
                state = 1
                continue
            match = re_01.match(line)
            if match:
                raise Exception(match.group(1))
            match = re_02.match(line)
            if match:
                raise Exception(match.group(2))
            if re_03.match(line):
                raise Exception(line)

        elif state == 1:
            # expect 'Working file' (only when using log instead of rlog)
            match = re_10.match(line)
            assert match, _('RCS file must be followed by working file')
            filename = util.normpath(match.group(1))
            state = 2

        elif state == 2:
            # expect 'symbolic names'
            if re_20.match(line):
                state = 3

        elif state == 3:
            # read the symbolic names and store as tags
            match = re_30.match(line)
            if match:
                rev = [int(x) for x in match.group(2).split('.')]

                # Convert magic branch number to an odd-numbered one
                revn = len(rev)
                if revn > 3 and (revn % 2) == 0 and rev[-2] == 0:
                    rev = rev[:-2] + rev[-1:]
                rev = tuple(rev)

                if rev not in tags:
                    tags[rev] = []
                tags[rev].append(match.group(1))

            elif re_31.match(line):
                state = 5
            elif re_32.match(line):
                state = 0

        elif state == 4:
            # expecting '------' separator before first revision
            if re_31.match(line):
                state = 5
            else:
                assert not re_32.match(line), _('must have at least some revisions')

        elif state == 5:
            # expecting revision number and possibly (ignored) lock indication
            # we create the logentry here from values stored in states 0 to 4,
            # as this state is re-entered for subsequent revisions of a file.
            match = re_50.match(line)
            assert match, _('expected revision number')
            e = logentry(rcs=scache(rcs), file=scache(filename),
                    revision=tuple([int(x) for x in match.group(1).split('.')]),
                    branches=[], parent=None,
                    synthetic=False)
            state = 6

        elif state == 6:
            # expecting date, author, state, lines changed
            match = re_60.match(line)
            assert match, _('revision must be followed by date line')
            d = match.group(1)
            if d[2] == '/':
                # Y2K: two-digit year, prepend the century
                d = '19' + d

            if len(d.split()) != 3:
                # cvs log dates always in GMT
                d = d + ' UTC'
            e.date = util.parsedate(d, ['%y/%m/%d %H:%M:%S', '%Y/%m/%d %H:%M:%S', '%Y-%m-%d %H:%M:%S'])
            e.author = scache(match.group(2))
            e.dead = match.group(3).lower() == 'dead'

            # lines changed: group 5 is '+added', group 6 is '-removed';
            # either may be missing
            if match.group(5):
                if match.group(6):
                    e.lines = (int(match.group(5)), int(match.group(6)))
                else:
                    e.lines = (int(match.group(5)), 0)
            elif match.group(6):
                e.lines = (0, int(match.group(6)))
            else:
                e.lines = None
            e.comment = []
            state = 7

        elif state == 7:
            # read the revision numbers of branches that start at this revision
            # or store the commit log message otherwise
            m = re_70.match(line)
            if m:
                e.branches = [tuple([int(y) for y in x.strip().split('.')])
                              for x in m.group(1).split(';')]
                state = 8
            elif re_31.match(line) and re_50.match(peek):
                # '----' separator followed by a revision line: next
                # revision of the same file (lookahead disambiguates
                # separators inside commit messages)
                state = 5
                store = True
            elif re_32.match(line):
                # '====' separator: end of this file's log
                state = 0
                store = True
            else:
                e.comment.append(line)

        elif state == 8:
            # store commit log message
            if re_31.match(line):
                state = 5
                store = True
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        # When a file is added on a branch B1, CVS creates a synthetic
        # dead trunk revision 1.1 so that the branch has a root.
        # Likewise, if you merge such a file to a later branch B2 (one
        # that already existed when the file was added on B1), CVS
        # creates a synthetic dead revision 1.1.x.1 on B2.  Don't drop
        # these revisions now, but mark them synthetic so
        # createchangeset() can take care of them.
        if (store and
            e.dead and
            e.revision[-1] == 1 and      # 1.1 or 1.1.x.1
            len(e.comment) == 1 and
            file_added_re.match(e.comment[0])):
            ui.debug(_('found synthetic rev in %s: %r\n')
                     % (e.rcs, e.comment[0]))
            e.synthetic = True

        if store:
            # clean up the results and save in the log.
            store = False
            e.tags = util.sort([scache(x) for x in tags.get(e.revision, [])])
            e.comment = scache('\n'.join(e.comment))

            revn = len(e.revision)
            if revn > 3 and (revn % 2) == 0:
                # even-length revision with more than 3 parts: a branch
                # revision; its branch name is the tag recorded (in
                # state 3) for the revision-number prefix, if any
                e.branch = tags.get(e.revision[:-1], [None])[0]
            else:
                e.branch = None

            log.append(e)

            # progress indicator every 100 entries
            if len(log) % 100 == 0:
                ui.status(util.ellipsis('%d %s' % (len(log), e.file), 80)+'\n')

    listsort(log, key=lambda x:(x.rcs, x.revision))

    # find parent revisions of individual files
    versions = {}
    for e in log:
        branch = e.revision[:-1]
        p = versions.get((e.rcs, branch), None)
        if p is None:
            # first revision seen on this branch: parent is the branch
            # point (revision minus the last two components)
            p = e.revision[:-2]
        e.parent = p
        versions[(e.rcs, branch)] = e.revision

    # update the log cache
    if cache:
        if log:
            # join up the old and new logs
            listsort(log, key=lambda x:x.date)

            if oldlog and oldlog[-1].date >= log[0].date:
                raise logerror('Log cache overlaps with new log entries,'
                               ' re-run without cache.')

            log = oldlog + log

            # write the new cachefile
            ui.note(_('writing cvs log cache %s\n') % cachefile)
            pickle.dump(log, file(cachefile, 'w'))
        else:
            log = oldlog

    ui.status(_('%d log entries\n') % len(log))

    return log
class changeset(object):
    '''A changeset assembled from one or more CVS log entries.

    Instances are plain attribute bags; every keyword passed to the
    constructor becomes an attribute.  The attributes used are:
    .author    - author name as CVS knows it
    .branch    - name of branch this changeset is on, or None
    .comment   - commit message
    .date      - the commit date as a (time, tz) tuple
    .entries   - list of logentry objects in this changeset
    .parents   - list of one or two parent changesets
    .tags      - list of tags on this changeset
    .synthetic - from synthetic revision "file ... added on branch ..."
    '''
    def __init__(self, **entries):
        # Every keyword argument becomes an instance attribute.
        for name, value in entries.items():
            setattr(self, name, value)
427 def createchangeset(ui, log, fuzz=60, mergefrom=None, mergeto=None):
427 def createchangeset(ui, log, fuzz=60, mergefrom=None, mergeto=None):
428 '''Convert log into changesets.'''
428 '''Convert log into changesets.'''
429
429
430 ui.status(_('creating changesets\n'))
430 ui.status(_('creating changesets\n'))
431
431
432 # Merge changesets
432 # Merge changesets
433
433
434 listsort(log, key=lambda x:(x.comment, x.author, x.branch, x.date))
434 listsort(log, key=lambda x:(x.comment, x.author, x.branch, x.date))
435
435
436 changesets = []
436 changesets = []
437 files = {}
437 files = {}
438 c = None
438 c = None
439 for i, e in enumerate(log):
439 for i, e in enumerate(log):
440
440
441 # Check if log entry belongs to the current changeset or not.
441 # Check if log entry belongs to the current changeset or not.
442 if not (c and
442 if not (c and
443 e.comment == c.comment and
443 e.comment == c.comment and
444 e.author == c.author and
444 e.author == c.author and
445 e.branch == c.branch and
445 e.branch == c.branch and
446 ((c.date[0] + c.date[1]) <=
446 ((c.date[0] + c.date[1]) <=
447 (e.date[0] + e.date[1]) <=
447 (e.date[0] + e.date[1]) <=
448 (c.date[0] + c.date[1]) + fuzz) and
448 (c.date[0] + c.date[1]) + fuzz) and
449 e.file not in files):
449 e.file not in files):
450 c = changeset(comment=e.comment, author=e.author,
450 c = changeset(comment=e.comment, author=e.author,
451 branch=e.branch, date=e.date, entries=[])
451 branch=e.branch, date=e.date, entries=[])
452 changesets.append(c)
452 changesets.append(c)
453 files = {}
453 files = {}
454 if len(changesets) % 100 == 0:
454 if len(changesets) % 100 == 0:
455 t = '%d %s' % (len(changesets), repr(e.comment)[1:-1])
455 t = '%d %s' % (len(changesets), repr(e.comment)[1:-1])
456 ui.status(util.ellipsis(t, 80) + '\n')
456 ui.status(util.ellipsis(t, 80) + '\n')
457
457
458 c.entries.append(e)
458 c.entries.append(e)
459 files[e.file] = True
459 files[e.file] = True
460 c.date = e.date # changeset date is date of latest commit in it
460 c.date = e.date # changeset date is date of latest commit in it
461
461
462 # Mark synthetic changesets
462 # Mark synthetic changesets
463
463
464 for c in changesets:
464 for c in changesets:
465 # Synthetic revisions always get their own changeset, because
465 # Synthetic revisions always get their own changeset, because
466 # the log message includes the filename. E.g. if you add file3
466 # the log message includes the filename. E.g. if you add file3
467 # and file4 on a branch, you get four log entries and three
467 # and file4 on a branch, you get four log entries and three
468 # changesets:
468 # changesets:
469 # "File file3 was added on branch ..." (synthetic, 1 entry)
469 # "File file3 was added on branch ..." (synthetic, 1 entry)
470 # "File file4 was added on branch ..." (synthetic, 1 entry)
470 # "File file4 was added on branch ..." (synthetic, 1 entry)
471 # "Add file3 and file4 to fix ..." (real, 2 entries)
471 # "Add file3 and file4 to fix ..." (real, 2 entries)
472 # Hence the check for 1 entry here.
472 # Hence the check for 1 entry here.
473 c.synthetic = (len(c.entries) == 1 and c.entries[0].synthetic)
473 c.synthetic = (len(c.entries) == 1 and c.entries[0].synthetic)
474
474
475 # Sort files in each changeset
475 # Sort files in each changeset
476
476
477 for c in changesets:
477 for c in changesets:
478 def pathcompare(l, r):
478 def pathcompare(l, r):
479 'Mimic cvsps sorting order'
479 'Mimic cvsps sorting order'
480 l = l.split('/')
480 l = l.split('/')
481 r = r.split('/')
481 r = r.split('/')
482 nl = len(l)
482 nl = len(l)
483 nr = len(r)
483 nr = len(r)
484 n = min(nl, nr)
484 n = min(nl, nr)
485 for i in range(n):
485 for i in range(n):
486 if i + 1 == nl and nl < nr:
486 if i + 1 == nl and nl < nr:
487 return -1
487 return -1
488 elif i + 1 == nr and nl > nr:
488 elif i + 1 == nr and nl > nr:
489 return +1
489 return +1
490 elif l[i] < r[i]:
490 elif l[i] < r[i]:
491 return -1
491 return -1
492 elif l[i] > r[i]:
492 elif l[i] > r[i]:
493 return +1
493 return +1
494 return 0
494 return 0
495 def entitycompare(l, r):
495 def entitycompare(l, r):
496 return pathcompare(l.file, r.file)
496 return pathcompare(l.file, r.file)
497
497
498 c.entries.sort(entitycompare)
498 c.entries.sort(entitycompare)
499
499
500 # Sort changesets by date
500 # Sort changesets by date
501
501
502 def cscmp(l, r):
502 def cscmp(l, r):
503 d = sum(l.date) - sum(r.date)
503 d = sum(l.date) - sum(r.date)
504 if d:
504 if d:
505 return d
505 return d
506
506
507 # detect vendor branches and initial commits on a branch
507 # detect vendor branches and initial commits on a branch
508 le = {}
508 le = {}
509 for e in l.entries:
509 for e in l.entries:
510 le[e.rcs] = e.revision
510 le[e.rcs] = e.revision
511 re = {}
511 re = {}
512 for e in r.entries:
512 for e in r.entries:
513 re[e.rcs] = e.revision
513 re[e.rcs] = e.revision
514
514
515 d = 0
515 d = 0
516 for e in l.entries:
516 for e in l.entries:
517 if re.get(e.rcs, None) == e.parent:
517 if re.get(e.rcs, None) == e.parent:
518 assert not d
518 assert not d
519 d = 1
519 d = 1
520 break
520 break
521
521
522 for e in r.entries:
522 for e in r.entries:
523 if le.get(e.rcs, None) == e.parent:
523 if le.get(e.rcs, None) == e.parent:
524 assert not d
524 assert not d
525 d = -1
525 d = -1
526 break
526 break
527
527
528 return d
528 return d
529
529
530 changesets.sort(cscmp)
530 changesets.sort(cscmp)
531
531
532 # Collect tags
532 # Collect tags
533
533
534 globaltags = {}
534 globaltags = {}
535 for c in changesets:
535 for c in changesets:
536 tags = {}
536 tags = {}
537 for e in c.entries:
537 for e in c.entries:
538 for tag in e.tags:
538 for tag in e.tags:
539 # remember which is the latest changeset to have this tag
539 # remember which is the latest changeset to have this tag
540 globaltags[tag] = c
540 globaltags[tag] = c
541
541
542 for c in changesets:
542 for c in changesets:
543 tags = {}
543 tags = {}
544 for e in c.entries:
544 for e in c.entries:
545 for tag in e.tags:
545 for tag in e.tags:
546 tags[tag] = True
546 tags[tag] = True
547 # remember tags only if this is the latest changeset to have it
547 # remember tags only if this is the latest changeset to have it
548 c.tags = util.sort([tag for tag in tags if globaltags[tag] is c])
548 c.tags = util.sort([tag for tag in tags if globaltags[tag] is c])
549
549
550 # Find parent changesets, handle {{mergetobranch BRANCHNAME}}
550 # Find parent changesets, handle {{mergetobranch BRANCHNAME}}
551 # by inserting dummy changesets with two parents, and handle
551 # by inserting dummy changesets with two parents, and handle
552 # {{mergefrombranch BRANCHNAME}} by setting two parents.
552 # {{mergefrombranch BRANCHNAME}} by setting two parents.
553
553
554 if mergeto is None:
554 if mergeto is None:
555 mergeto = r'{{mergetobranch ([-\w]+)}}'
555 mergeto = r'{{mergetobranch ([-\w]+)}}'
556 if mergeto:
556 if mergeto:
557 mergeto = re.compile(mergeto)
557 mergeto = re.compile(mergeto)
558
558
559 if mergefrom is None:
559 if mergefrom is None:
560 mergefrom = r'{{mergefrombranch ([-\w]+)}}'
560 mergefrom = r'{{mergefrombranch ([-\w]+)}}'
561 if mergefrom:
561 if mergefrom:
562 mergefrom = re.compile(mergefrom)
562 mergefrom = re.compile(mergefrom)
563
563
564 versions = {} # changeset index where we saw any particular file version
564 versions = {} # changeset index where we saw any particular file version
565 branches = {} # changeset index where we saw a branch
565 branches = {} # changeset index where we saw a branch
566 n = len(changesets)
566 n = len(changesets)
567 i = 0
567 i = 0
568 while i<n:
568 while i<n:
569 c = changesets[i]
569 c = changesets[i]
570
570
571 for f in c.entries:
571 for f in c.entries:
572 versions[(f.rcs, f.revision)] = i
572 versions[(f.rcs, f.revision)] = i
573
573
574 p = None
574 p = None
575 if c.branch in branches:
575 if c.branch in branches:
576 p = branches[c.branch]
576 p = branches[c.branch]
577 else:
577 else:
578 for f in c.entries:
578 for f in c.entries:
579 p = max(p, versions.get((f.rcs, f.parent), None))
579 p = max(p, versions.get((f.rcs, f.parent), None))
580
580
581 c.parents = []
581 c.parents = []
582 if p is not None:
582 if p is not None:
583 p = changesets[p]
583 p = changesets[p]
584
584
585 # Ensure no changeset has a synthetic changeset as a parent.
585 # Ensure no changeset has a synthetic changeset as a parent.
586 while p.synthetic:
586 while p.synthetic:
587 assert len(p.parents) <= 1, \
587 assert len(p.parents) <= 1, \
588 _('synthetic changeset cannot have multiple parents')
588 _('synthetic changeset cannot have multiple parents')
589 if p.parents:
589 if p.parents:
590 p = p.parents[0]
590 p = p.parents[0]
591 else:
591 else:
592 p = None
592 p = None
593 break
593 break
594
594
595 if p is not None:
595 if p is not None:
596 c.parents.append(p)
596 c.parents.append(p)
597
597
598 if mergefrom:
598 if mergefrom:
599 m = mergefrom.search(c.comment)
599 m = mergefrom.search(c.comment)
600 if m:
600 if m:
601 m = m.group(1)
601 m = m.group(1)
602 if m == 'HEAD':
602 if m == 'HEAD':
603 m = None
603 m = None
604 if m in branches and c.branch != m:
604 candidate = changesets[branches[m]]
605 c.parents.append(changesets[branches[m]])
605 if m in branches and c.branch != m and not candidate.synthetic:
606 c.parents.append(candidate)
606
607
607 if mergeto:
608 if mergeto:
608 m = mergeto.search(c.comment)
609 m = mergeto.search(c.comment)
609 if m:
610 if m:
610 try:
611 try:
611 m = m.group(1)
612 m = m.group(1)
612 if m == 'HEAD':
613 if m == 'HEAD':
613 m = None
614 m = None
614 except:
615 except:
615 m = None # if no group found then merge to HEAD
616 m = None # if no group found then merge to HEAD
616 if m in branches and c.branch != m:
617 if m in branches and c.branch != m:
617 # insert empty changeset for merge
618 # insert empty changeset for merge
618 cc = changeset(author=c.author, branch=m, date=c.date,
619 cc = changeset(author=c.author, branch=m, date=c.date,
619 comment='convert-repo: CVS merge from branch %s' % c.branch,
620 comment='convert-repo: CVS merge from branch %s' % c.branch,
620 entries=[], tags=[], parents=[changesets[branches[m]], c])
621 entries=[], tags=[], parents=[changesets[branches[m]], c])
621 changesets.insert(i + 1, cc)
622 changesets.insert(i + 1, cc)
622 branches[m] = i + 1
623 branches[m] = i + 1
623
624
624 # adjust our loop counters now we have inserted a new entry
625 # adjust our loop counters now we have inserted a new entry
625 n += 1
626 n += 1
626 i += 2
627 i += 2
627 continue
628 continue
628
629
629 branches[c.branch] = i
630 branches[c.branch] = i
630 i += 1
631 i += 1
631
632
632 # Drop synthetic changesets (safe now that we have ensured no other
633 # Drop synthetic changesets (safe now that we have ensured no other
633 # changesets can have them as parents).
634 # changesets can have them as parents).
634 i = 0
635 i = 0
635 while i < len(changesets):
636 while i < len(changesets):
636 if changesets[i].synthetic:
637 if changesets[i].synthetic:
637 del changesets[i]
638 del changesets[i]
638 else:
639 else:
639 i += 1
640 i += 1
640
641
641 # Number changesets
642 # Number changesets
642
643
643 for i, c in enumerate(changesets):
644 for i, c in enumerate(changesets):
644 c.id = i + 1
645 c.id = i + 1
645
646
646 ui.status(_('%d changeset entries\n') % len(changesets))
647 ui.status(_('%d changeset entries\n') % len(changesets))
647
648
648 return changesets
649 return changesets
649
650
650
651
651 def debugcvsps(ui, *args, **opts):
652 def debugcvsps(ui, *args, **opts):
652 '''Read CVS rlog for current directory or named path in repository, and
653 '''Read CVS rlog for current directory or named path in repository, and
653 convert the log to changesets based on matching commit log entries and dates.'''
654 convert the log to changesets based on matching commit log entries and dates.'''
654
655
655 if opts["new_cache"]:
656 if opts["new_cache"]:
656 cache = "write"
657 cache = "write"
657 elif opts["update_cache"]:
658 elif opts["update_cache"]:
658 cache = "update"
659 cache = "update"
659 else:
660 else:
660 cache = None
661 cache = None
661
662
662 revisions = opts["revisions"]
663 revisions = opts["revisions"]
663
664
664 try:
665 try:
665 if args:
666 if args:
666 log = []
667 log = []
667 for d in args:
668 for d in args:
668 log += createlog(ui, d, root=opts["root"], cache=cache)
669 log += createlog(ui, d, root=opts["root"], cache=cache)
669 else:
670 else:
670 log = createlog(ui, root=opts["root"], cache=cache)
671 log = createlog(ui, root=opts["root"], cache=cache)
671 except logerror, e:
672 except logerror, e:
672 ui.write("%r\n"%e)
673 ui.write("%r\n"%e)
673 return
674 return
674
675
675 changesets = createchangeset(ui, log, opts["fuzz"])
676 changesets = createchangeset(ui, log, opts["fuzz"])
676 del log
677 del log
677
678
678 # Print changesets (optionally filtered)
679 # Print changesets (optionally filtered)
679
680
680 off = len(revisions)
681 off = len(revisions)
681 branches = {} # latest version number in each branch
682 branches = {} # latest version number in each branch
682 ancestors = {} # parent branch
683 ancestors = {} # parent branch
683 for cs in changesets:
684 for cs in changesets:
684
685
685 if opts["ancestors"]:
686 if opts["ancestors"]:
686 if cs.branch not in branches and cs.parents and cs.parents[0].id:
687 if cs.branch not in branches and cs.parents and cs.parents[0].id:
687 ancestors[cs.branch] = changesets[cs.parents[0].id-1].branch, cs.parents[0].id
688 ancestors[cs.branch] = changesets[cs.parents[0].id-1].branch, cs.parents[0].id
688 branches[cs.branch] = cs.id
689 branches[cs.branch] = cs.id
689
690
690 # limit by branches
691 # limit by branches
691 if opts["branches"] and (cs.branch or 'HEAD') not in opts["branches"]:
692 if opts["branches"] and (cs.branch or 'HEAD') not in opts["branches"]:
692 continue
693 continue
693
694
694 if not off:
695 if not off:
695 # Note: trailing spaces on several lines here are needed to have
696 # Note: trailing spaces on several lines here are needed to have
696 # bug-for-bug compatibility with cvsps.
697 # bug-for-bug compatibility with cvsps.
697 ui.write('---------------------\n')
698 ui.write('---------------------\n')
698 ui.write('PatchSet %d \n' % cs.id)
699 ui.write('PatchSet %d \n' % cs.id)
699 ui.write('Date: %s\n' % util.datestr(cs.date, '%Y/%m/%d %H:%M:%S %1%2'))
700 ui.write('Date: %s\n' % util.datestr(cs.date, '%Y/%m/%d %H:%M:%S %1%2'))
700 ui.write('Author: %s\n' % cs.author)
701 ui.write('Author: %s\n' % cs.author)
701 ui.write('Branch: %s\n' % (cs.branch or 'HEAD'))
702 ui.write('Branch: %s\n' % (cs.branch or 'HEAD'))
702 ui.write('Tag%s: %s \n' % (['', 's'][len(cs.tags)>1],
703 ui.write('Tag%s: %s \n' % (['', 's'][len(cs.tags)>1],
703 ','.join(cs.tags) or '(none)'))
704 ','.join(cs.tags) or '(none)'))
704 if opts["parents"] and cs.parents:
705 if opts["parents"] and cs.parents:
705 if len(cs.parents)>1:
706 if len(cs.parents)>1:
706 ui.write('Parents: %s\n' % (','.join([str(p.id) for p in cs.parents])))
707 ui.write('Parents: %s\n' % (','.join([str(p.id) for p in cs.parents])))
707 else:
708 else:
708 ui.write('Parent: %d\n' % cs.parents[0].id)
709 ui.write('Parent: %d\n' % cs.parents[0].id)
709
710
710 if opts["ancestors"]:
711 if opts["ancestors"]:
711 b = cs.branch
712 b = cs.branch
712 r = []
713 r = []
713 while b:
714 while b:
714 b, c = ancestors[b]
715 b, c = ancestors[b]
715 r.append('%s:%d:%d' % (b or "HEAD", c, branches[b]))
716 r.append('%s:%d:%d' % (b or "HEAD", c, branches[b]))
716 if r:
717 if r:
717 ui.write('Ancestors: %s\n' % (','.join(r)))
718 ui.write('Ancestors: %s\n' % (','.join(r)))
718
719
719 ui.write('Log:\n')
720 ui.write('Log:\n')
720 ui.write('%s\n\n' % cs.comment)
721 ui.write('%s\n\n' % cs.comment)
721 ui.write('Members: \n')
722 ui.write('Members: \n')
722 for f in cs.entries:
723 for f in cs.entries:
723 fn = f.file
724 fn = f.file
724 if fn.startswith(opts["prefix"]):
725 if fn.startswith(opts["prefix"]):
725 fn = fn[len(opts["prefix"]):]
726 fn = fn[len(opts["prefix"]):]
726 ui.write('\t%s:%s->%s%s \n' % (fn, '.'.join([str(x) for x in f.parent]) or 'INITIAL',
727 ui.write('\t%s:%s->%s%s \n' % (fn, '.'.join([str(x) for x in f.parent]) or 'INITIAL',
727 '.'.join([str(x) for x in f.revision]), ['', '(DEAD)'][f.dead]))
728 '.'.join([str(x) for x in f.revision]), ['', '(DEAD)'][f.dead]))
728 ui.write('\n')
729 ui.write('\n')
729
730
730 # have we seen the start tag?
731 # have we seen the start tag?
731 if revisions and off:
732 if revisions and off:
732 if revisions[0] == str(cs.id) or \
733 if revisions[0] == str(cs.id) or \
733 revisions[0] in cs.tags:
734 revisions[0] in cs.tags:
734 off = False
735 off = False
735
736
736 # see if we reached the end tag
737 # see if we reached the end tag
737 if len(revisions)>1 and not off:
738 if len(revisions)>1 and not off:
738 if revisions[1] == str(cs.id) or \
739 if revisions[1] == str(cs.id) or \
739 revisions[1] in cs.tags:
740 revisions[1] in cs.tags:
740 break
741 break
General Comments 0
You need to be logged in to leave comments. Login now