##// END OF EJS Templates
cvsps: switch a file open to a with statement...
Augie Fackler -
r43322:3b8a4587 default
parent child Browse files
Show More
@@ -1,965 +1,966 b''
1 # Mercurial built-in replacement for cvsps.
1 # Mercurial built-in replacement for cvsps.
2 #
2 #
3 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
3 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7 from __future__ import absolute_import
7 from __future__ import absolute_import
8
8
9 import functools
9 import functools
10 import os
10 import os
11 import re
11 import re
12
12
13 from mercurial.i18n import _
13 from mercurial.i18n import _
14 from mercurial import (
14 from mercurial import (
15 encoding,
15 encoding,
16 error,
16 error,
17 hook,
17 hook,
18 pycompat,
18 pycompat,
19 util,
19 util,
20 )
20 )
21 from mercurial.utils import (
21 from mercurial.utils import (
22 dateutil,
22 dateutil,
23 procutil,
23 procutil,
24 stringutil,
24 stringutil,
25 )
25 )
26
26
27 pickle = util.pickle
27 pickle = util.pickle
28
28
class logentry(object):
    '''A single file revision parsed from CVS (r)log output.

    Attributes:
    .author - author name as CVS knows it
    .branch - name of branch this revision is on
    .branches - revision tuple of branches starting at this revision
    .comment - commit message
    .commitid - CVS commitid or None
    .date - the commit date as a (time, tz) tuple
    .dead - true if file revision is dead
    .file - Name of file
    .lines - a tuple (+lines, -lines) or None
    .parent - Previous revision of this entry
    .rcs - name of file as returned from CVS
    .revision - revision number as tuple
    .tags - list of tags on the file
    .synthetic - is this a synthetic "file ... added on ..." revision?
    .mergepoint - the branch that has been merged from (if present in
                  rlog output) or None
    .branchpoints - the branches that start at the current entry or empty
    '''
    def __init__(self, **entries):
        # default; may be overwritten by a keyword argument below
        self.synthetic = False
        vars(self).update(entries)

    def __repr__(self):
        fields = sorted(self.__dict__)
        body = r", ".join(r"%s=%r" % (f, self.__dict__[f]) for f in fields)
        return r"%s(%s)" % (type(self).__name__, body)
56
56
class logerror(Exception):
    '''Raised when CVS (r)log output cannot be collected or parsed.'''
59
59
def getrepopath(cvspath):
    """Return the repository path from a CVS path.

    >>> getrepopath(b'/foo/bar')
    '/foo/bar'
    >>> getrepopath(b'c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:10/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:10c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:truc@foo.bar:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:truc@foo.bar:c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b'user@server/path/to/repository')
    '/path/to/repository'
    """
    # Per the CVS manual, a CVS path looks like:
    #   [:method:][[user][:password]@]hostname[:[port]]/path/to/repository
    #
    # Take the last ':'-separated component and return everything from the
    # first '/' that follows the '@' (if there is one) — that slash starts
    # the repository path and is included in the result.
    tail = cvspath.split(':')[-1]
    at = tail.find('@')
    searchfrom = at if at != -1 else 0
    return tail[tail.find('/', searchfrom):]
98
98
def createlog(ui, directory=None, root="", rlog=True, cache=None):
    '''Collect the CVS rlog.

    Runs ``cvs rlog`` (or ``cvs log`` when rlog is False), parses its output
    with a state machine, and returns a list of logentry objects sorted by
    (rcs, revision).

    ui        - mercurial ui object, used for status/debug output and config
    directory - directory to log; None means use the current CVS sandbox
                (CVS/Repository and CVS/Root are consulted in that case)
    root      - CVSROOT to use; falls back to the sandbox CVS/Root file and
                then the CVSROOT environment variable
    rlog      - use 'rlog' (remote log) rather than 'log'
    cache     - None, or 'update' to read and extend the on-disk log cache
                under ~/.hg.cvsps

    Raises logerror when the sandbox is missing, CVS reports an error, or
    the cache overlaps with new log entries.
    '''

    # Because we store many duplicate commit log messages, reusing strings
    # saves a lot of memory and pickle storage space.
    _scache = {}
    def scache(s):
        "return a shared version of a string"
        return _scache.setdefault(s, s)

    ui.status(_('collecting CVS rlog\n'))

    log = []      # list of logentry objects containing the CVS state

    # patterns to match in CVS (r)log output, by state of use
    re_00 = re.compile(b'RCS file: (.+)$')
    re_01 = re.compile(b'cvs \\[r?log aborted\\]: (.+)$')
    re_02 = re.compile(b'cvs (r?log|server): (.+)\n$')
    re_03 = re.compile(b"(Cannot access.+CVSROOT)|"
                       b"(can't create temporary directory.+)$")
    re_10 = re.compile(b'Working file: (.+)$')
    re_20 = re.compile(b'symbolic names:')
    re_30 = re.compile(b'\t(.+): ([\\d.]+)$')
    re_31 = re.compile(b'----------------------------$')
    re_32 = re.compile(b'======================================='
                       b'======================================$')
    re_50 = re.compile(br'revision ([\d.]+)(\s+locked by:\s+.+;)?$')
    re_60 = re.compile(br'date:\s+(.+);\s+author:\s+(.+);\s+state:\s+(.+?);'
                       br'(\s+lines:\s+(\+\d+)?\s+(-\d+)?;)?'
                       br'(\s+commitid:\s+([^;]+);)?'
                       br'(.*mergepoint:\s+([^;]+);)?')
    re_70 = re.compile(b'branches: (.+);$')

    file_added_re = re.compile(br'file [^/]+ was (initially )?added on branch')

    prefix = ''   # leading path to strip of what we get from CVS

    if directory is None:
        # Current working directory

        # Get the real directory in the repository
        try:
            with open(os.path.join(b'CVS', b'Repository'), 'rb') as f:
                prefix = f.read().strip()
            directory = prefix
            if prefix == ".":
                prefix = ""
        except IOError:
            raise logerror(_('not a CVS sandbox'))

        if prefix and not prefix.endswith(pycompat.ossep):
            prefix += pycompat.ossep

        # Use the Root file in the sandbox, if it exists.  Use a with
        # statement so the file handle is not leaked.
        try:
            with open(os.path.join('CVS', 'Root'), 'rb') as f:
                root = f.read().strip()
        except IOError:
            pass

    if not root:
        root = encoding.environ.get('CVSROOT', '')

    # read log cache if one exists
    oldlog = []
    date = None

    if cache:
        cachedir = os.path.expanduser('~/.hg.cvsps')
        if not os.path.exists(cachedir):
            os.mkdir(cachedir)

        # The cvsps cache pickle needs a uniquified name, based on the
        # repository location. The address may have all sort of nasties
        # in it, slashes, colons and such. So here we take just the
        # alphanumeric characters, concatenated in a way that does not
        # mix up the various components, so that
        #    :pserver:user@server:/path
        # and
        #    /pserver/user/server/path
        # are mapped to different cache file names.
        cachefile = root.split(":") + [directory, "cache"]
        cachefile = ['-'.join(re.findall(br'\w+', s)) for s in cachefile if s]
        cachefile = os.path.join(cachedir,
                                 '.'.join([s for s in cachefile if s]))

        if cache == 'update':
            try:
                ui.note(_('reading cvs log cache %s\n') % cachefile)
                # NOTE: the cache is a pickle this code itself wrote under
                # the user's home directory, so it is treated as trusted.
                with open(cachefile, 'rb') as f:
                    oldlog = pickle.load(f)
                for e in oldlog:
                    if not (util.safehasattr(e, 'branchpoints') and
                            util.safehasattr(e, 'commitid') and
                            util.safehasattr(e, 'mergepoint')):
                        ui.status(_('ignoring old cache\n'))
                        oldlog = []
                        break

                ui.note(_('cache has %d log entries\n') % len(oldlog))
            except Exception as e:
                ui.note(_('error reading cache: %r\n') % e)

        if oldlog:
            date = oldlog[-1].date    # last commit date as a (time,tz) tuple
            date = dateutil.datestr(date, '%Y/%m/%d %H:%M:%S %1%2')

    # build the CVS commandline
    cmd = ['cvs', '-q']
    if root:
        cmd.append('-d%s' % root)
        p = util.normpath(getrepopath(root))
        if not p.endswith('/'):
            p += '/'
        if prefix:
            # looks like normpath replaces "" by "."
            prefix = p + util.normpath(prefix)
        else:
            prefix = p
    cmd.append(['log', 'rlog'][rlog])
    if date:
        # no space between option and date string
        cmd.append('-d>%s' % date)
    cmd.append(directory)

    # state machine begins here
    tags = {}     # dictionary of revisions on current file with their tags
    branchmap = {} # mapping between branch names and revision numbers
    rcsmap = {}
    state = 0
    store = False # set when a new record can be appended

    cmd = [procutil.shellquote(arg) for arg in cmd]
    ui.note(_("running %s\n") % (' '.join(cmd)))
    ui.debug("prefix=%r directory=%r root=%r\n" % (prefix, directory, root))

    pfp = procutil.popen(' '.join(cmd), 'rb')
    peek = util.fromnativeeol(pfp.readline())
    while True:
        line = peek
        if line == '':
            break
        peek = util.fromnativeeol(pfp.readline())
        if line.endswith('\n'):
            line = line[:-1]
        #ui.debug('state=%d line=%r\n' % (state, line))

        if state == 0:
            # initial state, consume input until we see 'RCS file'
            match = re_00.match(line)
            if match:
                rcs = match.group(1)
                tags = {}
                if rlog:
                    filename = util.normpath(rcs[:-2])
                    if filename.startswith(prefix):
                        filename = filename[len(prefix):]
                    if filename.startswith('/'):
                        filename = filename[1:]
                    if filename.startswith('Attic/'):
                        filename = filename[6:]
                    else:
                        filename = filename.replace('/Attic/', '/')
                    state = 2
                    continue
                state = 1
                continue
            match = re_01.match(line)
            if match:
                raise logerror(match.group(1))
            match = re_02.match(line)
            if match:
                raise logerror(match.group(2))
            if re_03.match(line):
                raise logerror(line)

        elif state == 1:
            # expect 'Working file' (only when using log instead of rlog)
            match = re_10.match(line)
            assert match, _('RCS file must be followed by working file')
            filename = util.normpath(match.group(1))
            state = 2

        elif state == 2:
            # expect 'symbolic names'
            if re_20.match(line):
                branchmap = {}
                state = 3

        elif state == 3:
            # read the symbolic names and store as tags
            match = re_30.match(line)
            if match:
                rev = [int(x) for x in match.group(2).split('.')]

                # Convert magic branch number to an odd-numbered one
                revn = len(rev)
                if revn > 3 and (revn % 2) == 0 and rev[-2] == 0:
                    rev = rev[:-2] + rev[-1:]
                rev = tuple(rev)

                if rev not in tags:
                    tags[rev] = []
                tags[rev].append(match.group(1))
                branchmap[match.group(1)] = match.group(2)

            elif re_31.match(line):
                state = 5
            elif re_32.match(line):
                state = 0

        elif state == 4:
            # expecting '------' separator before first revision
            if re_31.match(line):
                state = 5
            else:
                assert not re_32.match(line), _('must have at least '
                                                'some revisions')

        elif state == 5:
            # expecting revision number and possibly (ignored) lock indication
            # we create the logentry here from values stored in states 0 to 4,
            # as this state is re-entered for subsequent revisions of a file.
            match = re_50.match(line)
            assert match, _('expected revision number')
            e = logentry(rcs=scache(rcs),
                         file=scache(filename),
                         revision=tuple([int(x) for x in
                                         match.group(1).split('.')]),
                         branches=[],
                         parent=None,
                         commitid=None,
                         mergepoint=None,
                         branchpoints=set())

            state = 6

        elif state == 6:
            # expecting date, author, state, lines changed
            match = re_60.match(line)
            assert match, _('revision must be followed by date line')
            d = match.group(1)
            if d[2] == '/':
                # Y2K
                d = '19' + d

            if len(d.split()) != 3:
                # cvs log dates always in GMT
                d = d + ' UTC'
            e.date = dateutil.parsedate(d, ['%y/%m/%d %H:%M:%S',
                                            '%Y/%m/%d %H:%M:%S',
                                            '%Y-%m-%d %H:%M:%S'])
            e.author = scache(match.group(2))
            e.dead = match.group(3).lower() == 'dead'

            if match.group(5):
                if match.group(6):
                    e.lines = (int(match.group(5)), int(match.group(6)))
                else:
                    e.lines = (int(match.group(5)), 0)
            elif match.group(6):
                e.lines = (0, int(match.group(6)))
            else:
                e.lines = None

            if match.group(7): # cvs 1.12 commitid
                e.commitid = match.group(8)

            if match.group(9): # cvsnt mergepoint
                myrev = match.group(10).split('.')
                if len(myrev) == 2: # head
                    e.mergepoint = 'HEAD'
                else:
                    myrev = '.'.join(myrev[:-2] + ['0', myrev[-2]])
                    branches = [b for b in branchmap if branchmap[b] == myrev]
                    assert len(branches) == 1, ('unknown branch: %s'
                                                % e.mergepoint)
                    e.mergepoint = branches[0]

            e.comment = []
            state = 7

        elif state == 7:
            # read the revision numbers of branches that start at this revision
            # or store the commit log message otherwise
            m = re_70.match(line)
            if m:
                e.branches = [tuple([int(y) for y in x.strip().split('.')])
                              for x in m.group(1).split(';')]
                state = 8
            elif re_31.match(line) and re_50.match(peek):
                state = 5
                store = True
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        elif state == 8:
            # store commit log message
            if re_31.match(line):
                cpeek = peek
                if cpeek.endswith('\n'):
                    cpeek = cpeek[:-1]
                if re_50.match(cpeek):
                    state = 5
                    store = True
                else:
                    e.comment.append(line)
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        # When a file is added on a branch B1, CVS creates a synthetic
        # dead trunk revision 1.1 so that the branch has a root.
        # Likewise, if you merge such a file to a later branch B2 (one
        # that already existed when the file was added on B1), CVS
        # creates a synthetic dead revision 1.1.x.1 on B2.  Don't drop
        # these revisions now, but mark them synthetic so
        # createchangeset() can take care of them.
        if (store and
              e.dead and
              e.revision[-1] == 1 and      # 1.1 or 1.1.x.1
              len(e.comment) == 1 and
              file_added_re.match(e.comment[0])):
            ui.debug('found synthetic revision in %s: %r\n'
                     % (e.rcs, e.comment[0]))
            e.synthetic = True

        if store:
            # clean up the results and save in the log.
            store = False
            e.tags = sorted([scache(x) for x in tags.get(e.revision, [])])
            e.comment = scache('\n'.join(e.comment))

            revn = len(e.revision)
            if revn > 3 and (revn % 2) == 0:
                e.branch = tags.get(e.revision[:-1], [None])[0]
            else:
                e.branch = None

            # find the branches starting from this revision
            branchpoints = set()
            for branch, revision in branchmap.iteritems():
                revparts = tuple([int(i) for i in revision.split('.')])
                if len(revparts) < 2: # bad tags
                    continue
                if revparts[-2] == 0 and revparts[-1] % 2 == 0:
                    # normal branch
                    if revparts[:-2] == e.revision:
                        branchpoints.add(branch)
                elif revparts == (1, 1, 1): # vendor branch
                    if revparts in e.branches:
                        branchpoints.add(branch)
            e.branchpoints = branchpoints

            log.append(e)

            rcsmap[e.rcs.replace('/Attic/', '/')] = e.rcs

            if len(log) % 100 == 0:
                ui.status(stringutil.ellipsis('%d %s' % (len(log), e.file), 80)
                          + '\n')

    # readline() returned '' above, so the child has finished writing;
    # close our end of the pipe instead of leaking the handle.
    pfp.close()

    log.sort(key=lambda x: (x.rcs, x.revision))

    # find parent revisions of individual files
    versions = {}
    for e in sorted(oldlog, key=lambda x: (x.rcs, x.revision)):
        rcs = e.rcs.replace('/Attic/', '/')
        if rcs in rcsmap:
            e.rcs = rcsmap[rcs]
        branch = e.revision[:-1]
        versions[(e.rcs, branch)] = e.revision

    for e in log:
        branch = e.revision[:-1]
        p = versions.get((e.rcs, branch), None)
        if p is None:
            p = e.revision[:-2]
        e.parent = p
        versions[(e.rcs, branch)] = e.revision

    # update the log cache
    if cache:
        if log:
            # join up the old and new logs
            log.sort(key=lambda x: x.date)

            if oldlog and oldlog[-1].date >= log[0].date:
                raise logerror(_('log cache overlaps with new log entries,'
                                 ' re-run without cache.'))

            log = oldlog + log

            # write the new cachefile; with statement so the handle is
            # flushed and closed even if pickling fails
            ui.note(_('writing cvs log cache %s\n') % cachefile)
            with open(cachefile, 'wb') as f:
                pickle.dump(log, f)
        else:
            log = oldlog

    ui.status(_('%d log entries\n') % len(log))

    encodings = ui.configlist('convert', 'cvsps.logencoding')
    if encodings:
        def revstr(r):
            # this is needed, because logentry.revision is a tuple of "int"
            # (e.g. (1, 2) for "1.2")
            return '.'.join(pycompat.maplist(pycompat.bytestr, r))

        for entry in log:
            comment = entry.comment
            for e in encodings:
                try:
                    entry.comment = comment.decode(
                        pycompat.sysstr(e)).encode('utf-8')
                    if ui.debugflag:
                        ui.debug("transcoding by %s: %s of %s\n" %
                                 (e, revstr(entry.revision), entry.file))
                    break
                except UnicodeDecodeError:
                    pass # try next encoding
                except LookupError as inst: # unknown encoding, maybe
                    raise error.Abort(inst,
                                      hint=_('check convert.cvsps.logencoding'
                                             ' configuration'))
            else:
                raise error.Abort(_("no encoding can transcode"
                                    " CVS log message for %s of %s")
                                  % (revstr(entry.revision), entry.file),
                                  hint=_('check convert.cvsps.logencoding'
                                         ' configuration'))

    hook.hook(ui, None, "cvslog", True, log=log)

    return log
536
536
537
class changeset(object):
    '''A group of related CVS file revisions, treated as one commit.

    Attributes:
    .id - integer identifying this changeset (list index), or None
    .author - author name as CVS knows it
    .branch - name of branch this changeset is on, or None
    .comment - commit message
    .commitid - CVS commitid or None
    .date - the commit date as a (time,tz) tuple
    .entries - list of logentry objects in this changeset
    .parents - list of one or two parent changesets
    .tags - list of tags on this changeset
    .synthetic - from synthetic revision "file ... added on branch ..."
    .mergepoint- the branch that has been merged from or None
    .branchpoints- the branches that start at the current entry or empty
    '''
    def __init__(self, **kwargs):
        # Defaults first; keyword arguments may override either of them.
        self.id = None
        self.synthetic = False
        self.__dict__.update(kwargs)

    def __repr__(self):
        # Deterministic repr: attributes listed in sorted key order.
        fields = sorted(self.__dict__.items())
        body = ", ".join("%s=%r" % kv for kv in fields)
        return "%s(%s)" % (type(self).__name__, body)
560
561
def createchangeset(ui, log, fuzz=60, mergefrom=None, mergeto=None):
    '''Convert log into changesets.

    log is a list of logentry objects.  fuzz is the maximum number of
    seconds between two entries that may still be merged into a single
    changeset when no CVS commitid is available.  mergefrom/mergeto are
    bytes regex patterns matched against commit messages to detect
    {{mergefrombranch ...}} / {{mergetobranch ...}} markers; passing a
    falsy non-None value disables the corresponding handling.  Returns
    the list of changeset objects, numbered from 1 in their .id field.
    '''

    ui.status(_('creating changesets\n'))

    # try to order commitids by date
    mindate = {}
    for e in log:
        if e.commitid:
            if e.commitid not in mindate:
                mindate[e.commitid] = e.date
            else:
                mindate[e.commitid] = min(e.date, mindate[e.commitid])

    # Merge changesets
    log.sort(key=lambda x: (mindate.get(x.commitid, (-1, 0)),
                            x.commitid or '', x.comment,
                            x.author, x.branch or '', x.date, x.branchpoints))

    changesets = []
    files = set()
    c = None
    for i, e in enumerate(log):

        # Check if log entry belongs to the current changeset or not.

        # Since CVS is file-centric, two different file revisions with
        # different branchpoints should be treated as belonging to two
        # different changesets (and the ordering is important and not
        # honoured by cvsps at this point).
        #
        # Consider the following case:
        # foo 1.1 branchpoints: [MYBRANCH]
        # bar 1.1 branchpoints: [MYBRANCH, MYBRANCH2]
        #
        # Here foo is part only of MYBRANCH, but not MYBRANCH2, e.g. a
        # later version of foo may be in MYBRANCH2, so foo should be the
        # first changeset and bar the next and MYBRANCH and MYBRANCH2
        # should both start off of the bar changeset. No provisions are
        # made to ensure that this is, in fact, what happens.
        if not (c and e.branchpoints == c.branchpoints and
                (# cvs commitids
                 (e.commitid is not None and e.commitid == c.commitid) or
                 (# no commitids, use fuzzy commit detection
                  (e.commitid is None or c.commitid is None) and
                   e.comment == c.comment and
                   e.author == c.author and
                   e.branch == c.branch and
                   ((c.date[0] + c.date[1]) <=
                    (e.date[0] + e.date[1]) <=
                    (c.date[0] + c.date[1]) + fuzz) and
                   e.file not in files))):
            # entry does not match: start a new changeset seeded from it
            c = changeset(comment=e.comment, author=e.author,
                          branch=e.branch, date=e.date,
                          entries=[], mergepoint=e.mergepoint,
                          branchpoints=e.branchpoints, commitid=e.commitid)
            changesets.append(c)

            files = set()
            if len(changesets) % 100 == 0:
                # progress report every 100 changesets
                t = '%d %s' % (len(changesets), repr(e.comment)[1:-1])
                ui.status(stringutil.ellipsis(t, 80) + '\n')

        c.entries.append(e)
        files.add(e.file)
        c.date = e.date # changeset date is date of latest commit in it

    # Mark synthetic changesets

    for c in changesets:
        # Synthetic revisions always get their own changeset, because
        # the log message includes the filename. E.g. if you add file3
        # and file4 on a branch, you get four log entries and three
        # changesets:
        # "File file3 was added on branch ..." (synthetic, 1 entry)
        # "File file4 was added on branch ..." (synthetic, 1 entry)
        # "Add file3 and file4 to fix ..." (real, 2 entries)
        # Hence the check for 1 entry here.
        c.synthetic = len(c.entries) == 1 and c.entries[0].synthetic

    # Sort files in each changeset

    def entitycompare(l, r):
        'Mimic cvsps sorting order'
        l = l.file.split('/')
        r = r.file.split('/')
        nl = len(l)
        nr = len(r)
        n = min(nl, nr)
        for i in range(n):
            # shorter (shallower) paths sort before their longer siblings
            if i + 1 == nl and nl < nr:
                return -1
            elif i + 1 == nr and nl > nr:
                return +1
            elif l[i] < r[i]:
                return -1
            elif l[i] > r[i]:
                return +1
        return 0

    for c in changesets:
        c.entries.sort(key=functools.cmp_to_key(entitycompare))

    # Sort changesets by date

    odd = set()
    def cscmp(l, r):
        # primary key: commit time (seconds + tz offset summed)
        d = sum(l.date) - sum(r.date)
        if d:
            return d

        # detect vendor branches and initial commits on a branch
        le = {}
        for e in l.entries:
            le[e.rcs] = e.revision
        re = {}
        for e in r.entries:
            re[e.rcs] = e.revision

        d = 0
        for e in l.entries:
            if re.get(e.rcs, None) == e.parent:
                assert not d
                d = 1
                break

        for e in r.entries:
            if le.get(e.rcs, None) == e.parent:
                if d:
                    # contradictory ordering: each looks like the
                    # other's parent; remember the pair for a warning
                    odd.add((l, r))
                d = -1
                break
        # By this point, the changesets are sufficiently compared that
        # we don't really care about ordering. However, this leaves
        # some race conditions in the tests, so we compare on the
        # number of files modified, the files contained in each
        # changeset, and the branchpoints in the change to ensure test
        # output remains stable.

        # recommended replacement for cmp from
        # https://docs.python.org/3.0/whatsnew/3.0.html
        c = lambda x, y: (x > y) - (x < y)
        # Sort bigger changes first.
        if not d:
            d = c(len(l.entries), len(r.entries))
        # Try sorting by filename in the change.
        if not d:
            d = c([e.file for e in l.entries], [e.file for e in r.entries])
        # Try and put changes without a branch point before ones with
        # a branch point.
        if not d:
            d = c(len(l.branchpoints), len(r.branchpoints))
        return d

    changesets.sort(key=functools.cmp_to_key(cscmp))

    # Collect tags

    globaltags = {}
    for c in changesets:
        for e in c.entries:
            for tag in e.tags:
                # remember which is the latest changeset to have this tag
                globaltags[tag] = c

    for c in changesets:
        tags = set()
        for e in c.entries:
            tags.update(e.tags)
        # remember tags only if this is the latest changeset to have it
        c.tags = sorted(tag for tag in tags if globaltags[tag] is c)

    # Find parent changesets, handle {{mergetobranch BRANCHNAME}}
    # by inserting dummy changesets with two parents, and handle
    # {{mergefrombranch BRANCHNAME}} by setting two parents.

    if mergeto is None:
        mergeto = br'{{mergetobranch ([-\w]+)}}'
    if mergeto:
        mergeto = re.compile(mergeto)

    if mergefrom is None:
        mergefrom = br'{{mergefrombranch ([-\w]+)}}'
    if mergefrom:
        mergefrom = re.compile(mergefrom)

    # NOTE(review): 'versions' is populated below but never read inside
    # this function.
    versions = {} # changeset index where we saw any particular file version
    branches = {} # changeset index where we saw a branch
    n = len(changesets)
    i = 0
    while i < n:
        c = changesets[i]

        for f in c.entries:
            versions[(f.rcs, f.revision)] = i

        p = None
        if c.branch in branches:
            p = branches[c.branch]
        else:
            # first changeset on a new branch
            # the parent is a changeset with the branch in its
            # branchpoints such that it is the latest possible
            # commit without any intervening, unrelated commits.

            for candidate in pycompat.xrange(i):
                if c.branch not in changesets[candidate].branchpoints:
                    if p is not None:
                        break
                    continue
                p = candidate

        c.parents = []
        if p is not None:
            p = changesets[p]

            # Ensure no changeset has a synthetic changeset as a parent.
            while p.synthetic:
                assert len(p.parents) <= 1, (
                    _('synthetic changeset cannot have multiple parents'))
                if p.parents:
                    p = p.parents[0]
                else:
                    p = None
                    break

            if p is not None:
                c.parents.append(p)

        if c.mergepoint:
            if c.mergepoint == 'HEAD':
                c.mergepoint = None
            c.parents.append(changesets[branches[c.mergepoint]])

        if mergefrom:
            m = mergefrom.search(c.comment)
            if m:
                m = m.group(1)
                if m == 'HEAD':
                    m = None
                try:
                    candidate = changesets[branches[m]]
                except KeyError:
                    ui.warn(_("warning: CVS commit message references "
                              "non-existent branch %r:\n%s\n")
                            % (pycompat.bytestr(m), c.comment))
                if m in branches and c.branch != m and not candidate.synthetic:
                    c.parents.append(candidate)

        if mergeto:
            m = mergeto.search(c.comment)
            if m:
                if m.groups():
                    m = m.group(1)
                    if m == 'HEAD':
                        m = None
                else:
                    m = None # if no group found then merge to HEAD
                if m in branches and c.branch != m:
                    # insert empty changeset for merge
                    cc = changeset(
                        author=c.author, branch=m, date=c.date,
                        comment='convert-repo: CVS merge from branch %s'
                        % c.branch,
                        entries=[], tags=[],
                        parents=[changesets[branches[m]], c])
                    changesets.insert(i + 1, cc)
                    branches[m] = i + 1

                    # adjust our loop counters now we have inserted a new entry
                    n += 1
                    i += 2
                    continue

        branches[c.branch] = i
        i += 1

    # Drop synthetic changesets (safe now that we have ensured no other
    # changesets can have them as parents).
    i = 0
    while i < len(changesets):
        if changesets[i].synthetic:
            del changesets[i]
        else:
            i += 1

    # Number changesets

    for i, c in enumerate(changesets):
        c.id = i + 1

    if odd:
        # pairs recorded by cscmp whose mutual ordering was contradictory
        for l, r in odd:
            if l.id is not None and r.id is not None:
                ui.warn(_('changeset %d is both before and after %d\n')
                        % (l.id, r.id))

    ui.status(_('%d changeset entries\n') % len(changesets))

    hook.hook(ui, None, "cvschangesets", True, changesets=changesets)

    return changesets
863
864
864
865
def debugcvsps(ui, *args, **opts):
    '''Read CVS rlog for current directory or named path in
    repository, and convert the log to changesets based on matching
    commit log entries and dates.

    Output mimics the classic cvsps tool, including its whitespace
    quirks (see the bug-for-bug note below).  Recognized opts keys:
    new_cache/update_cache (cache mode), revisions (start/end tag or id
    filter), root, fuzz, branches, ancestors, parents, prefix.
    '''
    opts = pycompat.byteskwargs(opts)
    # translate the two cache flags into the mode string createlog expects
    if opts["new_cache"]:
        cache = "write"
    elif opts["update_cache"]:
        cache = "update"
    else:
        cache = None

    revisions = opts["revisions"]

    try:
        if args:
            # one combined log across all named paths
            log = []
            for d in args:
                log += createlog(ui, d, root=opts["root"], cache=cache)
        else:
            log = createlog(ui, root=opts["root"], cache=cache)
    except logerror as e:
        ui.write("%r\n"%e)
        return

    changesets = createchangeset(ui, log, opts["fuzz"])
    del log

    # Print changesets (optionally filtered)

    # off is truthy until the start revision/tag is seen (no filter: 0)
    off = len(revisions)
    branches = {} # latest version number in each branch
    ancestors = {} # parent branch
    for cs in changesets:

        if opts["ancestors"]:
            if cs.branch not in branches and cs.parents and cs.parents[0].id:
                ancestors[cs.branch] = (changesets[cs.parents[0].id - 1].branch,
                                        cs.parents[0].id)
            branches[cs.branch] = cs.id

        # limit by branches
        if opts["branches"] and (cs.branch or 'HEAD') not in opts["branches"]:
            continue

        if not off:
            # Note: trailing spaces on several lines here are needed to have
            # bug-for-bug compatibility with cvsps.
            ui.write('---------------------\n')
            ui.write(('PatchSet %d \n' % cs.id))
            ui.write(('Date: %s\n' % dateutil.datestr(cs.date,
                                                      '%Y/%m/%d %H:%M:%S %1%2')))
            ui.write(('Author: %s\n' % cs.author))
            ui.write(('Branch: %s\n' % (cs.branch or 'HEAD')))
            ui.write(('Tag%s: %s \n' % (['', 's'][len(cs.tags) > 1],
                                        ','.join(cs.tags) or '(none)')))
            if cs.branchpoints:
                ui.write(('Branchpoints: %s \n') %
                         ', '.join(sorted(cs.branchpoints)))
            if opts["parents"] and cs.parents:
                if len(cs.parents) > 1:
                    ui.write(('Parents: %s\n' %
                             (','.join([(b"%d" % p.id) for p in cs.parents]))))
                else:
                    ui.write(('Parent: %d\n' % cs.parents[0].id))

            if opts["ancestors"]:
                # walk the parent-branch chain recorded above up to HEAD
                b = cs.branch
                r = []
                while b:
                    b, c = ancestors[b]
                    r.append('%s:%d:%d' % (b or "HEAD", c, branches[b]))
                if r:
                    ui.write(('Ancestors: %s\n' % (','.join(r))))

            ui.write(('Log:\n'))
            ui.write('%s\n\n' % cs.comment)
            ui.write(('Members: \n'))
            for f in cs.entries:
                fn = f.file
                if fn.startswith(opts["prefix"]):
                    fn = fn[len(opts["prefix"]):]
                ui.write('\t%s:%s->%s%s \n' % (
                        fn,
                        '.'.join([b"%d" % x for x in f.parent]) or 'INITIAL',
                        '.'.join([(b"%d" % x) for x in f.revision]),
                        ['', '(DEAD)'][f.dead]))
            ui.write('\n')

        # have we seen the start tag?
        if revisions and off:
            if (revisions[0] == (b"%d" % cs.id) or
                revisions[0] in cs.tags):
                off = False

        # see if we reached the end tag
        if len(revisions) > 1 and not off:
            if (revisions[1] == (b"%d" % cs.id) or
                revisions[1] in cs.tags):
                break
General Comments 0
You need to be logged in to leave comments. Login now