##// END OF EJS Templates
cvsps: add b prefixes to regular expressions...
Augie Fackler -
r37901:72284d29 default
parent child Browse files
Show More
@@ -1,958 +1,958 b''
1 # Mercurial built-in replacement for cvsps.
1 # Mercurial built-in replacement for cvsps.
2 #
2 #
3 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
3 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7 from __future__ import absolute_import
7 from __future__ import absolute_import
8
8
9 import os
9 import os
10 import re
10 import re
11
11
12 from mercurial.i18n import _
12 from mercurial.i18n import _
13 from mercurial import (
13 from mercurial import (
14 encoding,
14 encoding,
15 error,
15 error,
16 hook,
16 hook,
17 pycompat,
17 pycompat,
18 util,
18 util,
19 )
19 )
20 from mercurial.utils import (
20 from mercurial.utils import (
21 dateutil,
21 dateutil,
22 procutil,
22 procutil,
23 stringutil,
23 stringutil,
24 )
24 )
25
25
26 pickle = util.pickle
26 pickle = util.pickle
27
27
class logentry(object):
    '''One file revision parsed from the CVS (r)log output.

    Attributes (filled in by createlog):
      .author       - author name as CVS knows it
      .branch       - name of branch this revision is on
      .branches     - revision tuple of branches starting at this revision
      .comment      - commit message
      .commitid     - CVS commitid or None
      .date         - the commit date as a (time, tz) tuple
      .dead         - true if file revision is dead
      .file         - Name of file
      .lines        - a tuple (+lines, -lines) or None
      .parent       - Previous revision of this entry
      .rcs          - name of file as returned from CVS
      .revision     - revision number as tuple
      .tags         - list of tags on the file
      .synthetic    - is this a synthetic "file ... added on ..." revision?
      .mergepoint   - the branch that has been merged from (if present in
                      rlog output) or None
      .branchpoints - the branches that start at the current entry or empty
    '''
    def __init__(self, **entries):
        # default; may be overridden by an explicit keyword argument
        self.synthetic = False
        self.__dict__.update(entries)

    def __repr__(self):
        # deterministic: attributes are rendered in sorted name order
        fields = sorted(self.__dict__)
        items = ["%s=%r" % (name, self.__dict__[name]) for name in fields]
        return "%s(%s)" % (type(self).__name__, ", ".join(items))
55
55
class logerror(Exception):
    '''Raised when collecting the CVS log fails: the directory is not a
    CVS sandbox, CVS itself reports an error in its (r)log output, or
    the on-disk log cache overlaps with newly collected entries.'''
    pass
58
58
def getrepopath(cvspath):
    """Return the repository path from a CVS path.

    >>> getrepopath(b'/foo/bar')
    '/foo/bar'
    >>> getrepopath(b'c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:10/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:10c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:truc@foo.bar:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b':pserver:truc@foo.bar:c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(b'user@server/path/to/repository')
    '/path/to/repository'
    """
    # Per the CVS manual, a CVS path has the shape
    #   [:method:][[user][:password]@]hostname[:[port]]/path/to/repository
    # so only the component after the last ':' can contain the repository
    # path.  Inside that component the path starts at the first '/' that
    # follows the '@' sign (if there is one).
    tail = cvspath.split(':')[-1]
    start = tail.find('@')
    if start == -1:
        start = 0
    return tail[tail.find('/', start):]
97
97
def createlog(ui, directory=None, root="", rlog=True, cache=None):
    '''Collect the CVS rlog.

    Runs ``cvs rlog`` (or ``cvs log`` when rlog is False) and parses its
    output with a line-oriented state machine, returning a list of
    logentry objects, one per file revision found.

    ui        - Mercurial ui object used for status/note/debug output
    directory - directory to log; None means the current CVS sandbox
                (CVS/Repository and CVS/Root are consulted)
    root      - CVSROOT to use; when empty, falls back to the sandbox
                Root file and then to $CVSROOT
    rlog      - select the 'rlog' subcommand instead of 'log'
    cache     - truthy enables writing the pickle log cache under
                ~/.hg.cvsps; the value 'update' additionally reads an
                existing cache and only logs entries newer than it

    Raises logerror for CVS-reported errors, a missing sandbox, or a
    cache that overlaps with newly collected entries.
    '''

    # Because we store many duplicate commit log messages, reusing strings
    # saves a lot of memory and pickle storage space.
    _scache = {}
    def scache(s):
        "return a shared version of a string"
        return _scache.setdefault(s, s)

    ui.status(_('collecting CVS rlog\n'))

    log = []      # list of logentry objects containing the CVS state

    # patterns to match in CVS (r)log output, by state of use
    re_00 = re.compile(b'RCS file: (.+)$')
    re_01 = re.compile(b'cvs \\[r?log aborted\\]: (.+)$')
    re_02 = re.compile(b'cvs (r?log|server): (.+)\n$')
    re_03 = re.compile(b"(Cannot access.+CVSROOT)|"
                       b"(can't create temporary directory.+)$")
    re_10 = re.compile(b'Working file: (.+)$')
    re_20 = re.compile(b'symbolic names:')
    re_30 = re.compile(b'\t(.+): ([\\d.]+)$')
    re_31 = re.compile(b'----------------------------$')
    re_32 = re.compile(b'======================================='
                       b'======================================$')
    re_50 = re.compile(b'revision ([\\d.]+)(\s+locked by:\s+.+;)?$')
    re_60 = re.compile(br'date:\s+(.+);\s+author:\s+(.+);\s+state:\s+(.+?);'
                       br'(\s+lines:\s+(\+\d+)?\s+(-\d+)?;)?'
                       br'(\s+commitid:\s+([^;]+);)?'
                       br'(.*mergepoint:\s+([^;]+);)?')
    re_70 = re.compile(b'branches: (.+);$')

    # matches the synthetic commit message CVS writes for the dead
    # revision it creates when a file is first added on a branch
    file_added_re = re.compile(br'file [^/]+ was (initially )?added on branch')

    prefix = ''   # leading path to strip of what we get from CVS

    if directory is None:
        # Current working directory

        # Get the real directory in the repository
        try:
            prefix = open(os.path.join('CVS','Repository'), 'rb').read().strip()
            directory = prefix
            if prefix == ".":
                prefix = ""
        except IOError:
            raise logerror(_('not a CVS sandbox'))

        if prefix and not prefix.endswith(pycompat.ossep):
            prefix += pycompat.ossep

        # Use the Root file in the sandbox, if it exists
        try:
            root = open(os.path.join('CVS','Root'), 'rb').read().strip()
        except IOError:
            pass

    if not root:
        root = encoding.environ.get('CVSROOT', '')

    # read log cache if one exists
    oldlog = []
    date = None

    if cache:
        cachedir = os.path.expanduser('~/.hg.cvsps')
        if not os.path.exists(cachedir):
            os.mkdir(cachedir)

        # The cvsps cache pickle needs a uniquified name, based on the
        # repository location. The address may have all sort of nasties
        # in it, slashes, colons and such. So here we take just the
        # alphanumeric characters, concatenated in a way that does not
        # mix up the various components, so that
        #    :pserver:user@server:/path
        # and
        #    /pserver/user/server/path
        # are mapped to different cache file names.
        cachefile = root.split(":") + [directory, "cache"]
        cachefile = ['-'.join(re.findall(br'\w+', s)) for s in cachefile if s]
        cachefile = os.path.join(cachedir,
                                 '.'.join([s for s in cachefile if s]))

        if cache == 'update':
            try:
                ui.note(_('reading cvs log cache %s\n') % cachefile)
                # NOTE(review): pickle.load trusts whatever is in
                # ~/.hg.cvsps; acceptable because it is a user-local cache
                oldlog = pickle.load(open(cachefile, 'rb'))
                for e in oldlog:
                    # a cache written by an older cvsps lacks these
                    # attributes; discard it rather than crash later
                    if not (util.safehasattr(e, 'branchpoints') and
                            util.safehasattr(e, 'commitid') and
                            util.safehasattr(e, 'mergepoint')):
                        ui.status(_('ignoring old cache\n'))
                        oldlog = []
                        break

                ui.note(_('cache has %d log entries\n') % len(oldlog))
            except Exception as e:
                # best-effort: a broken/missing cache just means a full run
                ui.note(_('error reading cache: %r\n') % e)

        if oldlog:
            date = oldlog[-1].date    # last commit date as a (time,tz) tuple
            date = dateutil.datestr(date, '%Y/%m/%d %H:%M:%S %1%2')

    # build the CVS commandline
    cmd = ['cvs', '-q']
    if root:
        cmd.append('-d%s' % root)
        p = util.normpath(getrepopath(root))
        if not p.endswith('/'):
            p += '/'
        if prefix:
            # looks like normpath replaces "" by "."
            prefix = p + util.normpath(prefix)
        else:
            prefix = p
    # select the subcommand by indexing with the rlog boolean
    cmd.append(['log', 'rlog'][rlog])
    if date:
        # no space between option and date string
        cmd.append('-d>%s' % date)
    cmd.append(directory)

    # state machine begins here
    # states (see the branches below):
    #   0 wait for 'RCS file'     1 wait for 'Working file'
    #   2 wait for 'symbolic names'  3 read tags   4 wait for '-----'
    #   5 read revision number    6 read date/author line
    #   7 read branches/comment   8 read comment
    tags = {}     # dictionary of revisions on current file with their tags
    branchmap = {} # mapping between branch names and revision numbers
    rcsmap = {}
    state = 0
    store = False # set when a new record can be appended

    cmd = [procutil.shellquote(arg) for arg in cmd]
    ui.note(_("running %s\n") % (' '.join(cmd)))
    ui.debug("prefix=%r directory=%r root=%r\n" % (prefix, directory, root))

    pfp = procutil.popen(' '.join(cmd), 'rb')
    # one line of lookahead ('peek') is kept so that states 7/8 can tell
    # whether a '-----' separator is followed by another revision
    peek = util.fromnativeeol(pfp.readline())
    while True:
        line = peek
        if line == '':
            break
        peek = util.fromnativeeol(pfp.readline())
        if line.endswith('\n'):
            line = line[:-1]
        #ui.debug('state=%d line=%r\n' % (state, line))

        if state == 0:
            # initial state, consume input until we see 'RCS file'
            match = re_00.match(line)
            if match:
                rcs = match.group(1)
                tags = {}
                if rlog:
                    # strip the ',v' suffix and the repository prefix to
                    # recover the working-file name
                    filename = util.normpath(rcs[:-2])
                    if filename.startswith(prefix):
                        filename = filename[len(prefix):]
                    if filename.startswith('/'):
                        filename = filename[1:]
                    if filename.startswith('Attic/'):
                        filename = filename[6:]
                    else:
                        filename = filename.replace('/Attic/', '/')
                    state = 2
                    continue
                state = 1
                continue
            match = re_01.match(line)
            if match:
                raise logerror(match.group(1))
            match = re_02.match(line)
            if match:
                raise logerror(match.group(2))
            if re_03.match(line):
                raise logerror(line)

        elif state == 1:
            # expect 'Working file' (only when using log instead of rlog)
            match = re_10.match(line)
            assert match, _('RCS file must be followed by working file')
            filename = util.normpath(match.group(1))
            state = 2

        elif state == 2:
            # expect 'symbolic names'
            if re_20.match(line):
                branchmap = {}
                state = 3

        elif state == 3:
            # read the symbolic names and store as tags
            match = re_30.match(line)
            if match:
                rev = [int(x) for x in match.group(2).split('.')]

                # Convert magic branch number to an odd-numbered one
                revn = len(rev)
                if revn > 3 and (revn % 2) == 0 and rev[-2] == 0:
                    rev = rev[:-2] + rev[-1:]
                rev = tuple(rev)

                if rev not in tags:
                    tags[rev] = []
                tags[rev].append(match.group(1))
                branchmap[match.group(1)] = match.group(2)

            elif re_31.match(line):
                state = 5
            elif re_32.match(line):
                state = 0

        elif state == 4:
            # expecting '------' separator before first revision
            if re_31.match(line):
                state = 5
            else:
                assert not re_32.match(line), _('must have at least '
                                                'some revisions')

        elif state == 5:
            # expecting revision number and possibly (ignored) lock indication
            # we create the logentry here from values stored in states 0 to 4,
            # as this state is re-entered for subsequent revisions of a file.
            match = re_50.match(line)
            assert match, _('expected revision number')
            e = logentry(rcs=scache(rcs),
                         file=scache(filename),
                         revision=tuple([int(x) for x in
                                         match.group(1).split('.')]),
                         branches=[],
                         parent=None,
                         commitid=None,
                         mergepoint=None,
                         branchpoints=set())

            state = 6

        elif state == 6:
            # expecting date, author, state, lines changed
            match = re_60.match(line)
            assert match, _('revision must be followed by date line')
            d = match.group(1)
            if d[2] == '/':
                # Y2K
                d = '19' + d

            if len(d.split()) != 3:
                # cvs log dates always in GMT
                d = d + ' UTC'
            e.date = dateutil.parsedate(d, ['%y/%m/%d %H:%M:%S',
                                            '%Y/%m/%d %H:%M:%S',
                                            '%Y-%m-%d %H:%M:%S'])
            e.author = scache(match.group(2))
            e.dead = match.group(3).lower() == 'dead'

            # lines changed: group(5) is '+N', group(6) is '-N'; either
            # may be absent
            if match.group(5):
                if match.group(6):
                    e.lines = (int(match.group(5)), int(match.group(6)))
                else:
                    e.lines = (int(match.group(5)), 0)
            elif match.group(6):
                e.lines = (0, int(match.group(6)))
            else:
                e.lines = None

            if match.group(7): # cvs 1.12 commitid
                e.commitid = match.group(8)

            if match.group(9): # cvsnt mergepoint
                myrev = match.group(10).split('.')
                if len(myrev) == 2: # head
                    e.mergepoint = 'HEAD'
                else:
                    # rebuild the magic branch number and look up the
                    # branch name that owns it
                    myrev = '.'.join(myrev[:-2] + ['0', myrev[-2]])
                    branches = [b for b in branchmap if branchmap[b] == myrev]
                    assert len(branches) == 1, ('unknown branch: %s'
                                                % e.mergepoint)
                    e.mergepoint = branches[0]

            e.comment = []
            state = 7

        elif state == 7:
            # read the revision numbers of branches that start at this revision
            # or store the commit log message otherwise
            m = re_70.match(line)
            if m:
                e.branches = [tuple([int(y) for y in x.strip().split('.')])
                              for x in m.group(1).split(';')]
                state = 8
            elif re_31.match(line) and re_50.match(peek):
                state = 5
                store = True
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        elif state == 8:
            # store commit log message
            if re_31.match(line):
                # '-----' only ends the message if the next line starts a
                # new revision; otherwise it is part of the message text
                cpeek = peek
                if cpeek.endswith('\n'):
                    cpeek = cpeek[:-1]
                if re_50.match(cpeek):
                    state = 5
                    store = True
                else:
                    e.comment.append(line)
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        # When a file is added on a branch B1, CVS creates a synthetic
        # dead trunk revision 1.1 so that the branch has a root.
        # Likewise, if you merge such a file to a later branch B2 (one
        # that already existed when the file was added on B1), CVS
        # creates a synthetic dead revision 1.1.x.1 on B2.  Don't drop
        # these revisions now, but mark them synthetic so
        # createchangeset() can take care of them.
        if (store and
              e.dead and
              e.revision[-1] == 1 and      # 1.1 or 1.1.x.1
              len(e.comment) == 1 and
              file_added_re.match(e.comment[0])):
            ui.debug('found synthetic revision in %s: %r\n'
                     % (e.rcs, e.comment[0]))
            e.synthetic = True

        if store:
            # clean up the results and save in the log.
            store = False
            e.tags = sorted([scache(x) for x in tags.get(e.revision, [])])
            e.comment = scache('\n'.join(e.comment))

            # even-length revision tuples longer than (major, minor)
            # denote a branch revision; its branch name is the tag on the
            # enclosing branch number, if any
            revn = len(e.revision)
            if revn > 3 and (revn % 2) == 0:
                e.branch = tags.get(e.revision[:-1], [None])[0]
            else:
                e.branch = None

            # find the branches starting from this revision
            branchpoints = set()
            for branch, revision in branchmap.iteritems():
                revparts = tuple([int(i) for i in revision.split('.')])
                if len(revparts) < 2: # bad tags
                    continue
                if revparts[-2] == 0 and revparts[-1] % 2 == 0:
                    # normal branch
                    if revparts[:-2] == e.revision:
                        branchpoints.add(branch)
                elif revparts == (1, 1, 1): # vendor branch
                    if revparts in e.branches:
                        branchpoints.add(branch)
            e.branchpoints = branchpoints

            log.append(e)

            # remember the non-Attic name so cached entries for files
            # later moved to the Attic can be matched up below
            rcsmap[e.rcs.replace('/Attic/', '/')] = e.rcs

            if len(log) % 100 == 0:
                ui.status(stringutil.ellipsis('%d %s' % (len(log), e.file), 80)
                          + '\n')

    log.sort(key=lambda x: (x.rcs, x.revision))

    # find parent revisions of individual files
    versions = {}
    for e in sorted(oldlog, key=lambda x: (x.rcs, x.revision)):
        rcs = e.rcs.replace('/Attic/', '/')
        if rcs in rcsmap:
            e.rcs = rcsmap[rcs]
        branch = e.revision[:-1]
        versions[(e.rcs, branch)] = e.revision

    for e in log:
        branch = e.revision[:-1]
        p = versions.get((e.rcs, branch), None)
        if p is None:
            # first revision on this branch: parent is the branchpoint
            p = e.revision[:-2]
        e.parent = p
        versions[(e.rcs, branch)] = e.revision

    # update the log cache
    if cache:
        if log:
            # join up the old and new logs
            log.sort(key=lambda x: x.date)

            if oldlog and oldlog[-1].date >= log[0].date:
                raise logerror(_('log cache overlaps with new log entries,'
                                 ' re-run without cache.'))

            log = oldlog + log

            # write the new cachefile
            ui.note(_('writing cvs log cache %s\n') % cachefile)
            pickle.dump(log, open(cachefile, 'wb'))
        else:
            log = oldlog

    ui.status(_('%d log entries\n') % len(log))

    encodings = ui.configlist('convert', 'cvsps.logencoding')
    if encodings:
        def revstr(r):
            # this is needed, because logentry.revision is a tuple of "int"
            # (e.g. (1, 2) for "1.2")
            return '.'.join(pycompat.maplist(pycompat.bytestr, r))

        # re-encode every comment to UTF-8 using the first configured
        # encoding that can decode it
        for entry in log:
            comment = entry.comment
            for e in encodings:
                try:
                    entry.comment = comment.decode(e).encode('utf-8')
                    if ui.debugflag:
                        ui.debug("transcoding by %s: %s of %s\n" %
                                 (e, revstr(entry.revision), entry.file))
                    break
                except UnicodeDecodeError:
                    pass # try next encoding
                except LookupError as inst: # unknown encoding, maybe
                    raise error.Abort(inst,
                                      hint=_('check convert.cvsps.logencoding'
                                             ' configuration'))
            else:
                raise error.Abort(_("no encoding can transcode"
                                    " CVS log message for %s of %s")
                                  % (revstr(entry.revision), entry.file),
                                  hint=_('check convert.cvsps.logencoding'
                                         ' configuration'))

    hook.hook(ui, None, "cvslog", True, log=log)

    return log
533
533
534
534
class changeset(object):
    '''A whole commit reconstructed from individual CVS file revisions.

    Attributes:
    .id - integer identifying this changeset (list index)
    .author - author name as CVS knows it
    .branch - name of branch this changeset is on, or None
    .comment - commit message
    .commitid - CVS commitid or None
    .date - the commit date as a (time,tz) tuple
    .entries - list of logentry objects in this changeset
    .parents - list of one or two parent changesets
    .tags - list of tags on this changeset
    .synthetic - from synthetic revision "file ... added on branch ..."
    .mergepoint- the branch that has been merged from or None
    .branchpoints- the branches that start at the current entry or empty
    '''
    def __init__(self, **entries):
        # Defaults first, so callers may override them via keyword args.
        self.id = None
        self.synthetic = False
        for name, value in entries.items():
            setattr(self, name, value)

    def __repr__(self):
        # Attributes are unique keys, so sorting the items sorts by name
        # and value comparison is never reached.
        pairs = ["%s=%r" % (name, value)
                 for name, value in sorted(self.__dict__.items())]
        return "%s(%s)" % (type(self).__name__, ", ".join(pairs))
558
558
def createchangeset(ui, log, fuzz=60, mergefrom=None, mergeto=None):
    '''Convert log into changesets.

    ui        - user interface object, used for status/progress output
    log       - list of logentry objects (one per CVS file revision),
                as produced by createlog(); sorted in place
    fuzz      - maximum gap in seconds between two file revisions that
                may still be folded into the same changeset
    mergefrom - bytes regex matched against commit messages to detect
                "merge from branch" markers; None selects the default
                pattern, any other false value disables the feature
    mergeto   - likewise for "merge to branch" markers

    Returns the list of changeset objects, numbered from 1 via .id.
    '''

    ui.status(_('creating changesets\n'))

    # try to order commitids by date
    mindate = {}
    for e in log:
        if e.commitid:
            # NOTE(review): on the first sighting of a commitid,
            # mindate.get() returns None and under Python 2
            # min((time, tz), None) evaluates to None, so every value in
            # mindate ends up None and the date ordering below degrades
            # to ordering by commitid alone -- confirm this is intended.
            mindate[e.commitid] = min(e.date, mindate.get(e.commitid))

    # Merge changesets
    log.sort(key=lambda x: (mindate.get(x.commitid), x.commitid, x.comment,
                            x.author, x.branch, x.date, x.branchpoints))

    changesets = []
    files = set()           # files already seen in the current changeset
    c = None                # the changeset currently being accumulated
    for i, e in enumerate(log):

        # Check if log entry belongs to the current changeset or not.

        # Since CVS is file-centric, two different file revisions with
        # different branchpoints should be treated as belonging to two
        # different changesets (and the ordering is important and not
        # honoured by cvsps at this point).
        #
        # Consider the following case:
        # foo 1.1 branchpoints: [MYBRANCH]
        # bar 1.1 branchpoints: [MYBRANCH, MYBRANCH2]
        #
        # Here foo is part only of MYBRANCH, but not MYBRANCH2, e.g. a
        # later version of foo may be in MYBRANCH2, so foo should be the
        # first changeset and bar the next and MYBRANCH and MYBRANCH2
        # should both start off of the bar changeset. No provisions are
        # made to ensure that this is, in fact, what happens.
        if not (c and e.branchpoints == c.branchpoints and
                (# cvs commitids
                 (e.commitid is not None and e.commitid == c.commitid) or
                 (# no commitids, use fuzzy commit detection
                  (e.commitid is None or c.commitid is None) and
                  e.comment == c.comment and
                  e.author == c.author and
                  e.branch == c.branch and
                  ((c.date[0] + c.date[1]) <=
                   (e.date[0] + e.date[1]) <=
                   (c.date[0] + c.date[1]) + fuzz) and
                  e.file not in files))):
            # Entry does not fit the current changeset: open a new one.
            c = changeset(comment=e.comment, author=e.author,
                          branch=e.branch, date=e.date,
                          entries=[], mergepoint=e.mergepoint,
                          branchpoints=e.branchpoints, commitid=e.commitid)
            changesets.append(c)

            files = set()
            # Progress indication every 100 changesets.
            if len(changesets) % 100 == 0:
                t = '%d %s' % (len(changesets), repr(e.comment)[1:-1])
                ui.status(stringutil.ellipsis(t, 80) + '\n')

        c.entries.append(e)
        files.add(e.file)
        c.date = e.date # changeset date is date of latest commit in it

    # Mark synthetic changesets

    for c in changesets:
        # Synthetic revisions always get their own changeset, because
        # the log message includes the filename. E.g. if you add file3
        # and file4 on a branch, you get four log entries and three
        # changesets:
        # "File file3 was added on branch ..." (synthetic, 1 entry)
        # "File file4 was added on branch ..." (synthetic, 1 entry)
        # "Add file3 and file4 to fix ..." (real, 2 entries)
        # Hence the check for 1 entry here.
        c.synthetic = len(c.entries) == 1 and c.entries[0].synthetic

    # Sort files in each changeset

    def entitycompare(l, r):
        'Mimic cvsps sorting order'
        # Compare path component by component; a shorter path that is a
        # prefix of a longer one sorts first.
        l = l.file.split('/')
        r = r.file.split('/')
        nl = len(l)
        nr = len(r)
        n = min(nl, nr)
        for i in range(n):
            if i + 1 == nl and nl < nr:
                return -1
            elif i + 1 == nr and nl > nr:
                return +1
            elif l[i] < r[i]:
                return -1
            elif l[i] > r[i]:
                return +1
        return 0

    for c in changesets:
        # NOTE(review): Python 2 cmp-function form of sort(); under
        # Python 3 this would need functools.cmp_to_key -- verify the
        # target interpreter before porting.
        c.entries.sort(entitycompare)

    # Sort changesets by date

    odd = set()     # pairs of changesets ordered both ways (cycle warning)
    def cscmp(l, r):
        # Primary key: commit date (time + tz offset).
        d = sum(l.date) - sum(r.date)
        if d:
            return d

        # detect vendor branches and initial commits on a branch
        le = {}
        for e in l.entries:
            le[e.rcs] = e.revision
        re = {}
        for e in r.entries:
            re[e.rcs] = e.revision

        d = 0
        # If any of l's entries has r's revision as its parent, l must
        # come after r (and vice versa below).
        for e in l.entries:
            if re.get(e.rcs, None) == e.parent:
                assert not d
                d = 1
                break

        for e in r.entries:
            if le.get(e.rcs, None) == e.parent:
                if d:
                    # Both directions claim precedence: remember the
                    # pair so a warning can be issued after numbering.
                    odd.add((l, r))
                d = -1
                break
        # By this point, the changesets are sufficiently compared that
        # we don't really care about ordering. However, this leaves
        # some race conditions in the tests, so we compare on the
        # number of files modified, the files contained in each
        # changeset, and the branchpoints in the change to ensure test
        # output remains stable.

        # recommended replacement for cmp from
        # https://docs.python.org/3.0/whatsnew/3.0.html
        c = lambda x, y: (x > y) - (x < y)
        # Sort bigger changes first.
        if not d:
            d = c(len(l.entries), len(r.entries))
        # Try sorting by filename in the change.
        if not d:
            d = c([e.file for e in l.entries], [e.file for e in r.entries])
        # Try and put changes without a branch point before ones with
        # a branch point.
        if not d:
            d = c(len(l.branchpoints), len(r.branchpoints))
        return d

    # NOTE(review): cmp-function sort again (Python 2 only form).
    changesets.sort(cscmp)

    # Collect tags

    globaltags = {}
    for c in changesets:
        for e in c.entries:
            for tag in e.tags:
                # remember which is the latest changeset to have this tag
                globaltags[tag] = c

    for c in changesets:
        tags = set()
        for e in c.entries:
            tags.update(e.tags)
        # remember tags only if this is the latest changeset to have it
        c.tags = sorted(tag for tag in tags if globaltags[tag] is c)

    # Find parent changesets, handle {{mergetobranch BRANCHNAME}}
    # by inserting dummy changesets with two parents, and handle
    # {{mergefrombranch BRANCHNAME}} by setting two parents.

    if mergeto is None:
        mergeto = br'{{mergetobranch ([-\w]+)}}'
    if mergeto:
        mergeto = re.compile(mergeto)

    if mergefrom is None:
        mergefrom = br'{{mergefrombranch ([-\w]+)}}'
    if mergefrom:
        mergefrom = re.compile(mergefrom)

    # NOTE(review): 'versions' is populated below but never read inside
    # this function -- possibly vestigial; confirm before removing.
    versions = {} # changeset index where we saw any particular file version
    branches = {} # changeset index where we saw a branch
    n = len(changesets)
    i = 0
    while i < n:
        c = changesets[i]

        for f in c.entries:
            versions[(f.rcs, f.revision)] = i

        p = None
        if c.branch in branches:
            p = branches[c.branch]
        else:
            # first changeset on a new branch
            # the parent is a changeset with the branch in its
            # branchpoints such that it is the latest possible
            # commit without any intervening, unrelated commits.

            # NOTE(review): xrange is Python 2 only.
            for candidate in xrange(i):
                if c.branch not in changesets[candidate].branchpoints:
                    if p is not None:
                        break
                    continue
                p = candidate

        c.parents = []
        if p is not None:
            p = changesets[p]

            # Ensure no changeset has a synthetic changeset as a parent.
            while p.synthetic:
                assert len(p.parents) <= 1, \
                       _('synthetic changeset cannot have multiple parents')
                if p.parents:
                    p = p.parents[0]
                else:
                    p = None
                    break

            if p is not None:
                c.parents.append(p)

        if c.mergepoint:
            if c.mergepoint == 'HEAD':
                c.mergepoint = None
            c.parents.append(changesets[branches[c.mergepoint]])

        if mergefrom:
            m = mergefrom.search(c.comment)
            if m:
                m = m.group(1)
                if m == 'HEAD':
                    m = None
                try:
                    candidate = changesets[branches[m]]
                except KeyError:
                    ui.warn(_("warning: CVS commit message references "
                              "non-existent branch %r:\n%s\n")
                            % (m, c.comment))
                if m in branches and c.branch != m and not candidate.synthetic:
                    c.parents.append(candidate)

        if mergeto:
            m = mergeto.search(c.comment)
            if m:
                if m.groups():
                    m = m.group(1)
                    if m == 'HEAD':
                        m = None
                else:
                    m = None # if no group found then merge to HEAD
                if m in branches and c.branch != m:
                    # insert empty changeset for merge
                    cc = changeset(
                        author=c.author, branch=m, date=c.date,
                        comment='convert-repo: CVS merge from branch %s'
                                % c.branch,
                        entries=[], tags=[],
                        parents=[changesets[branches[m]], c])
                    changesets.insert(i + 1, cc)
                    branches[m] = i + 1

                    # adjust our loop counters now we have inserted a new entry
                    n += 1
                    i += 2
                    continue

        branches[c.branch] = i
        i += 1

    # Drop synthetic changesets (safe now that we have ensured no other
    # changesets can have them as parents).
    i = 0
    while i < len(changesets):
        if changesets[i].synthetic:
            del changesets[i]
        else:
            i += 1

    # Number changesets

    for i, c in enumerate(changesets):
        c.id = i + 1

    if odd:
        # Warn about pairs that cscmp() found ordered both ways.
        for l, r in odd:
            if l.id is not None and r.id is not None:
                ui.warn(_('changeset %d is both before and after %d\n')
                        % (l.id, r.id))

    ui.status(_('%d changeset entries\n') % len(changesets))

    hook.hook(ui, None, "cvschangesets", True, changesets=changesets)

    return changesets
857
857
858
858
def debugcvsps(ui, *args, **opts):
    '''Read CVS rlog for current directory or named path in
    repository, and convert the log to changesets based on matching
    commit log entries and dates.

    args - optional repository paths to log; the current directory is
           used when none are given
    opts - command options: new_cache/update_cache (log cache policy),
           revisions (start/end tag or id filter), root, fuzz,
           branches, parents, ancestors, prefix

    Output format deliberately mimics the cvsps tool, including its
    trailing-whitespace quirks.
    '''
    opts = pycompat.byteskwargs(opts)
    # Translate the two cache flags into createlog()'s cache mode.
    if opts["new_cache"]:
        cache = "write"
    elif opts["update_cache"]:
        cache = "update"
    else:
        cache = None

    revisions = opts["revisions"]

    try:
        if args:
            log = []
            for d in args:
                log += createlog(ui, d, root=opts["root"], cache=cache)
        else:
            log = createlog(ui, root=opts["root"], cache=cache)
    except logerror as e:
        # Report the failure and bail out instead of propagating.
        ui.write("%r\n"%e)
        return

    changesets = createchangeset(ui, log, opts["fuzz"])
    del log

    # Print changesets (optionally filtered)

    # off is truthy until the start revision/tag (if any) is seen.
    off = len(revisions)
    branches = {} # latest version number in each branch
    ancestors = {} # parent branch
    for cs in changesets:

        if opts["ancestors"]:
            if cs.branch not in branches and cs.parents and cs.parents[0].id:
                ancestors[cs.branch] = (changesets[cs.parents[0].id - 1].branch,
                                        cs.parents[0].id)
            branches[cs.branch] = cs.id

        # limit by branches
        if opts["branches"] and (cs.branch or 'HEAD') not in opts["branches"]:
            continue

        if not off:
            # Note: trailing spaces on several lines here are needed to have
            # bug-for-bug compatibility with cvsps.
            ui.write('---------------------\n')
            ui.write(('PatchSet %d \n' % cs.id))
            ui.write(('Date: %s\n' % dateutil.datestr(cs.date,
                                                      '%Y/%m/%d %H:%M:%S %1%2')))
            ui.write(('Author: %s\n' % cs.author))
            ui.write(('Branch: %s\n' % (cs.branch or 'HEAD')))
            ui.write(('Tag%s: %s \n' % (['', 's'][len(cs.tags) > 1],
                                        ','.join(cs.tags) or '(none)')))
            if cs.branchpoints:
                ui.write(('Branchpoints: %s \n') %
                         ', '.join(sorted(cs.branchpoints)))
            if opts["parents"] and cs.parents:
                if len(cs.parents) > 1:
                    ui.write(('Parents: %s\n' %
                             (','.join([(b"%d" % p.id) for p in cs.parents]))))
                else:
                    ui.write(('Parent: %d\n' % cs.parents[0].id))

            if opts["ancestors"]:
                # Walk the parent-branch chain recorded above to HEAD.
                b = cs.branch
                r = []
                while b:
                    b, c = ancestors[b]
                    r.append('%s:%d:%d' % (b or "HEAD", c, branches[b]))
                if r:
                    ui.write(('Ancestors: %s\n' % (','.join(r))))

            ui.write(('Log:\n'))
            ui.write('%s\n\n' % cs.comment)
            ui.write(('Members: \n'))
            for f in cs.entries:
                fn = f.file
                if fn.startswith(opts["prefix"]):
                    fn = fn[len(opts["prefix"]):]
                # NOTE(review): str(x) for the parent revision vs
                # b"%d" for the current revision -- under Python 3
                # str() would yield unicode inside a bytes format;
                # confirm which interpreter this targets.
                ui.write('\t%s:%s->%s%s \n' % (
                        fn, '.'.join([str(x) for x in f.parent]) or 'INITIAL',
                        '.'.join([(b"%d" % x) for x in f.revision]),
                        ['', '(DEAD)'][f.dead]))
            ui.write('\n')

        # have we seen the start tag?
        if revisions and off:
            if revisions[0] == (b"%d" % cs.id) or \
                revisions[0] in cs.tags:
                off = False

        # see if we reached the end tag
        if len(revisions) > 1 and not off:
            if revisions[1] == (b"%d" % cs.id) or \
                revisions[1] in cs.tags:
                break
General Comments 0
You need to be logged in to leave comments. Login now