##// END OF EJS Templates
Fix network pull of repo files with "%" in their base64 encoding.
mpm@selenic.com -
r15:6daf7757 default
parent child Browse files
Show More
@@ -1,575 +1,578 b''
1 1 # hg.py - repository classes for mercurial
2 2 #
3 3 # Copyright 2005 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms
6 6 # of the GNU General Public License, incorporated herein by reference.
7 7
8 8 import sys, struct, sha, socket, os, time, base64, re, urllib2, binascii
9 import urllib
9 10 from mercurial import byterange
10 11 from mercurial.transaction import *
11 12 from mercurial.revlog import *
12 13
def hex(node):
    """Return the hexadecimal text form of the binary string `node`."""
    encoded = binascii.hexlify(node)
    return encoded
def bin(node):
    """Return the binary string encoded by the hexadecimal text `node`."""
    decoded = binascii.unhexlify(node)
    return decoded
15 16
class filelog(revlog):
    """Revision log holding the history of one tracked file.

    The index and data files live under "data/" and are named after an
    encoding of the SHA-1 digest of the tracked path (see encodepath).
    """

    def __init__(self, opener, path):
        """Open the revlog for the tracked file `path` through `opener`."""
        s = self.encodepath(path)
        revlog.__init__(self, opener, os.path.join("data", s + "i"),
                        os.path.join("data", s))

    def encodepath(self, path):
        """Return the on-disk base name used for the tracked file `path`.

        The name is the base64 encoding of the SHA-1 digest of `path` with
        the last three characters of the encoded string dropped, "+"
        replaced by "%" and "/" replaced by "_".
        """
        s = sha.sha(path).digest()
        s = base64.encodestring(s)[:-3]
        # plain substring replacement; no regular expression is needed
        s = s.replace("+", "%")
        s = s.replace("/", "_")
        return s

    def read(self, node):
        """Return the result of self.revision(node)."""
        return self.revision(node)

    def add(self, text, transaction, link, p1=None, p2=None):
        """Add `text` as a new revision via self.addrevision."""
        return self.addrevision(text, transaction, link, p1, p2)

    def resolvedag(self, old, new, transaction, link):
        """resolve unmerged heads in our DAG

        Returns None when `old` and `new` are the same node, `new` when
        `old` is their common ancestor, and otherwise the result of a
        three-way merge of the two.
        """
        if old == new: return None
        a = self.ancestor(old, new)
        if old == a: return new
        return self.merge3(old, new, a, transaction, link)

    def merge3(self, my, other, base, transaction, link):
        """perform a 3-way merge and append the result

        The three revisions are written to temporary files and the command
        named by the HGMERGE environment variable is run on them (local,
        remote, parent).  The contents of the local file afterwards are
        added as a new revision with parents `my` and `other`.

        Raises KeyError when HGMERGE is unset and the string exception
        "Merge failed, implement rollback!" when the command returns a
        non-zero status.  The temporary files are removed in every case.
        """
        # imported locally: this module does not import tempfile by name
        import tempfile

        def temp(prefix, node):
            # write one revision to a fresh temporary file, return its name
            (fd, name) = tempfile.mkstemp(prefix=prefix)
            f = os.fdopen(fd, "w")
            try:
                f.write(self.revision(node))
            finally:
                f.close()
            return name

        names = []
        try:
            for prefix, node in (("local", my), ("remote", other),
                                 ("parent", base)):
                names.append(temp(prefix, node))
            (a, b, c) = names

            cmd = os.environ["HGMERGE"]
            r = os.system("%s %s %s %s" % (cmd, a, b, c))
            if r:
                raise "Merge failed, implement rollback!"

            f = open(a)
            try:
                t = f.read()
            finally:
                f.close()
        finally:
            # best-effort cleanup so a failed merge leaves no files behind
            for name in names:
                try:
                    os.unlink(name)
                except OSError:
                    pass
        return self.addrevision(t, transaction, link, my, other)

    def merge(self, other, transaction, linkseq, link):
        """perform a merge and resolve resulting heads"""
        (o, n) = self.mergedag(other, transaction, linkseq)
        return self.resolvedag(o, n, transaction, link)
69 70
class manifest(revlog):
    """Revlog whose revisions map file names to file node ids.

    Each revision's text is a sequence of "name\\0hexnode\\n" lines.  The
    most recently read or added revision is cached both as a dict
    (mapcache) and as a list of lines (listcache).
    """

    def __init__(self, opener):
        """Open "00manifest.i" / "00manifest.d" through `opener`."""
        self.mapcache = None
        self.listcache = None
        self.addlist = None
        revlog.__init__(self, opener, "00manifest.i", "00manifest.d")

    def read(self, node):
        """Return the {file name: binary node} dict for revision `node`.

        The returned dict is the cached object itself, not a copy.
        """
        cached = self.mapcache
        if cached and cached[0] == node:
            return cached[1]
        lines = self.revision(node).splitlines(1)
        self.listcache = lines
        filemap = {}
        for entry in lines:
            (name, rest) = entry.split('\0')
            # only the first 40 characters after the NUL are the hex node
            filemap[name] = bin(rest[:40])
        self.mapcache = (node, filemap)
        return filemap

    def diff(self, a, b):
        """Return an mdiff delta, preferring the cached line lists.

        When a line cache exists, `a` and `b` are ignored and the delta is
        computed between listcache and addlist instead.
        """
        # this is sneaky, as we're not actually using a and b
        if not self.listcache:
            return mdiff.diff(a, b)
        return mdiff.diff(self.listcache, self.addlist, 1)

    def add(self, map, transaction, link, p1=None, p2=None):
        """Add `map` ({file name: binary node}) as a new revision.

        Returns the node reported by self.addrevision and makes `map` the
        cached revision.
        """
        names = list(map)
        names.sort()

        entries = []
        for name in names:
            entries.append("%s\000%s\n" % (name, hex(map[name])))
        # addlist must be in place before addrevision runs, since diff()
        # reads it
        self.addlist = entries

        node = self.addrevision("".join(entries), transaction, link, p1, p2)
        self.mapcache = (node, map)
        self.listcache = entries

        return node
108 109
class changelog(revlog):
    """Revlog of changesets.

    A changeset's text is: the manifest node in hex, the user, the date,
    one line per changed file, an empty line, then the description.
    """

    def __init__(self, opener):
        """Open "00changelog.i" / "00changelog.d" through `opener`."""
        revlog.__init__(self, opener, "00changelog.i", "00changelog.d")

    def extract(self, text):
        """Split changeset `text` into its fields.

        Returns (manifest, user, date, files, desc) where `manifest` is the
        binary manifest node, `files` is a list of file names and `desc` is
        everything after the first empty line.  Raises ValueError when the
        text contains no empty line.
        """
        last = text.index("\n\n")
        desc = text[last + 2:]
        l = text[:last].splitlines()
        manifest = bin(l[0])
        user = l[1]
        date = l[2]
        files = l[3:]
        return (manifest, user, date, files, desc)

    def read(self, node):
        """Return the extracted fields of changeset `node`."""
        return self.extract(self.revision(node))

    def add(self, manifest, list, desc, transaction, p1=None, p2=None):
        """Add a changeset and return the result of self.addrevision.

        `manifest` is the binary manifest node, `list` the changed file
        names (sorted in place) and `desc` the description.  The user is
        $HGUSER, or $LOGNAME@<fully qualified host name> when HGUSER is
        unset; KeyError is raised if neither variable is set.  The date is
        the current time and time.timezone as two integers.
        """
        # only a missing variable selects the fallback; anything else
        # (e.g. KeyboardInterrupt) must propagate
        try:
            user = os.environ["HGUSER"]
        except KeyError:
            user = os.environ["LOGNAME"] + '@' + socket.getfqdn()
        date = "%d %d" % (time.time(), time.timezone)
        list.sort()
        l = [hex(manifest), user, date] + list + ["", desc]
        text = "\n".join(l)
        # the new changeset links to itself: its revision number is the
        # current count
        return self.addrevision(text, transaction, self.count(), p1, p2)

    def merge3(self, my, other, base):
        """Placeholder; does nothing."""
        pass
137 138
class dircache:
    """Cache of (st_mode, st_size, st_mtime) for files in the working dir.

    The cache is stored in the file "dircache" as a sequence of records:
    four big-endian 32-bit integers (mode, size, mtime, name length)
    followed by the file name.  It is loaded lazily and written back when
    the object is destroyed while dirty.
    """

    def __init__(self, opener):
        """Remember `opener`; nothing is read until it is needed."""
        self.opener = opener
        self.dirty = 0
        self.map = None

    def __del__(self):
        if self.dirty: self.write()

    def __getitem__(self, key):
        """Return the cached tuple for `key`, loading the cache if needed."""
        self.read()
        return self.map[key]

    def read(self):
        """Load the cache from disk unless it is already loaded.

        An unreadable "dircache" file yields an empty cache.
        """
        if self.map is not None: return self.map

        self.map = {}
        try:
            st = self.opener("dircache").read()
        except (IOError, OSError):
            return

        pos = 0
        while pos < len(st):
            e = struct.unpack(">llll", st[pos:pos+16])
            l = e[3]
            pos += 16
            f = st[pos:pos + l]
            self.map[f] = e[:3]
            pos += l

    def update(self, files):
        """Refresh the entries for `files` from os.stat.

        Files that cannot be stat'ed are dropped from the cache.
        """
        if not files: return
        self.read()
        self.dirty = 1
        for f in files:
            try:
                s = os.stat(f)
                self.map[f] = (s.st_mode, s.st_size, s.st_mtime)
            except (IOError, OSError):
                # os.stat reports failures as OSError; remove() expects a
                # list of names, not a single name
                self.remove([f])

    def taint(self, files):
        """Mark `files` with the placeholder entry (0, -1, 0)."""
        if not files: return
        self.read()
        self.dirty = 1
        for f in files:
            self.map[f] = (0, -1, 0)

    def remove(self, files):
        """Drop `files` from the cache; unknown names are ignored."""
        if not files: return
        self.read()
        self.dirty = 1
        for f in files:
            try:
                del self.map[f]
            except KeyError:
                pass

    def clear(self):
        """Forget every entry and mark the cache dirty."""
        self.map = {}
        self.dirty = 1

    def write(self):
        """Write every entry to the "dircache" file and clear the dirty flag."""
        st = self.opener("dircache", "w")
        try:
            for f, e in self.map.items():
                e = struct.pack(">llll", e[0], e[1], e[2], len(f))
                st.write(e + f)
        finally:
            st.close()
        self.dirty = 0

    def copy(self):
        """Return a shallow copy of the (loaded) cache dict."""
        self.read()
        return self.map.copy()
209 210
# used to avoid circular references so destructors work
def opener(base):
    """Return a function o(path, mode="r") that opens `path` under `base`.

    When `base` starts with "http://" the URL-quoted path is joined to it
    and an httprangereader for that URL is returned; `mode` is ignored.

    Otherwise a local file object is returned.  Before a file is opened in
    any mode other than "r", an existing file with more than one hard link
    is first replaced by a private copy, so the write does not show
    through the other links.
    """
    p = base
    def o(path, mode="r"):
        if p[:7] == "http://":
            f = os.path.join(p, urllib.quote(path))
            return httprangereader(f)

        f = os.path.join(p, path)

        if mode != "r" and os.path.isfile(f):
            s = os.stat(f)
            if s.st_nlink > 1:
                # copy byte-for-byte and close both handles explicitly so
                # the copy is complete on disk before it replaces f
                src = open(f, "rb")
                try:
                    data = src.read()
                finally:
                    src.close()
                dst = open(f + ".tmp", "wb")
                try:
                    dst.write(data)
                finally:
                    dst.close()
                os.rename(f + ".tmp", f)

        return open(f, mode)

    return o
227 230
class repository:
    """A repository: changelog, manifest, file logs and working directory.

    A path starting with "http://" makes a remote repository (self.remote
    is 1, no dircache and no current node are set up).  Otherwise the
    metadata lives in the ".hg" directory under the repository root.
    """

    def __init__(self, ui, path=None, create=0):
        """Open the repository at `path`, or the one containing the cwd.

        With no `path`, the current directory and its parents are searched
        for a ".hg" directory; the string exception "No repo found" is
        raised when the search fails.  With `create` true, the ".hg" and
        ".hg/data" directories are created first.
        """
        self.remote = 0
        if path and path[:7] == "http://":
            self.remote = 1
            self.path = path
        else:
            if not path:
                path = self._findroot(os.getcwd())
            self.path = os.path.join(path, ".hg")

        self.root = path
        self.ui = ui

        if create:
            os.mkdir(self.path)
            os.mkdir(self.join("data"))

        self.opener = opener(self.path)
        self.manifest = manifest(self.opener)
        self.changelog = changelog(self.opener)
        self.ignorelist = None

        if not self.remote:
            self.dircache = dircache(self.opener)
            try:
                self.current = bin(self.opener("current").read())
            except IOError:
                self.current = None

    def _findroot(self, start):
        """Return the nearest directory at or above `start` holding ".hg"."""
        p = start
        while not os.path.isdir(os.path.join(p, ".hg")):
            parent = os.path.dirname(p)
            # stop at "/" and also whenever dirname() makes no progress,
            # which is how roots other than "/" show up
            if parent == "/" or parent == p:
                raise "No repo found"
            p = parent
        return p

    def setcurrent(self, node):
        """Record `node` as the current node, in memory and in "current"."""
        self.current = node
        f = self.opener("current", "w")
        try:
            f.write(hex(node))
        finally:
            f.close()

    def ignore(self, f):
        """Return True when `f` matches a pattern from ".hgignore".

        The file is read once from the repository root; each non-empty
        line is compiled as a regular expression and searched for in `f`.
        A missing ".hgignore" means nothing is ignored.
        """
        if self.ignorelist is None:
            self.ignorelist = []
            try:
                fp = open(os.path.join(self.root, ".hgignore"))
                try:
                    l = fp.readlines()
                finally:
                    fp.close()
                for pat in l:
                    # strip only the line terminator, so a final line
                    # without one keeps its last character
                    pat = pat.rstrip("\n")
                    if pat:
                        self.ignorelist.append(re.compile(pat))
            except IOError: pass
        for pat in self.ignorelist:
            if pat.search(f): return True
        return False

    def join(self, f):
        """Return `f` joined onto the repository metadata path."""
        return os.path.join(self.path, f)

    def file(self, f):
        """Return the filelog for the tracked file `f`."""
        return filelog(self.opener, f)

    def transaction(self):
        """Return a new transaction journaled in the "journal" file."""
        return transaction(self.opener, self.join("journal"))

    def merge(self, other):
        """Pull the changesets of repository `other` and merge them.

        Changesets, the files they touch and the manifests are merged in
        that order.  When the local changelog head is an ancestor of the
        incoming one, nothing further is needed; otherwise the manifests
        are resolved and a merge changeset is committed.
        """
        tr = self.transaction()
        changed = {}
        new = {}
        seqrev = self.changelog.count()
        # some magic to allow fiddling in nested scope
        nextrev = [seqrev]

        # helpers for back-linking file revisions to local changeset
        # revisions so we can immediately get to changeset from annotate
        def accumulate(text):
            # track which files are added in which changeset and the
            # corresponding _local_ changeset revision
            files = self.changelog.extract(text)[3]
            for f in files:
                changed.setdefault(f, []).append(nextrev[0])
            nextrev[0] += 1

        def seq(start):
            while 1:
                yield start
                start += 1

        def lseq(l):
            for r in l:
                yield r

        # begin the import/merge of changesets
        self.ui.status("merging new changesets\n")
        (co, cn) = self.changelog.mergedag(other.changelog, tr,
                                           seq(seqrev), accumulate)
        resolverev = self.changelog.count()

        # is there anything to do?
        if co == cn:
            tr.close()
            return

        # do we need to resolve?
        simple = (co == self.changelog.ancestor(co, cn))

        # merge all files changed by the changesets,
        # keeping track of the new tips
        changelist = changed.keys()
        changelist.sort()
        for f in changelist:
            sys.stdout.write(".")
            sys.stdout.flush()
            r = self.file(f)
            node = r.merge(other.file(f), tr, lseq(changed[f]), resolverev)
            if node:
                new[f] = node
        sys.stdout.write("\n")

        # begin the merge of the manifest
        self.ui.status("merging manifests\n")
        (mm, mo) = self.manifest.mergedag(other.manifest, tr, seq(seqrev))

        # For simple merges, we don't need to resolve manifests or changesets
        if simple:
            tr.close()
            return

        ma = self.manifest.ancestor(mm, mo)

        # resolve the manifest to point to all the merged files
        self.ui.status("resolving manifests\n")
        mmap = self.manifest.read(mm) # mine
        omap = self.manifest.read(mo) # other
        amap = self.manifest.read(ma) # ancestor
        nmap = {}

        for f, mid in mmap.iteritems():
            if f in omap:
                if mid != omap[f]:
                    nmap[f] = new.get(f, mid) # use merged version
                else:
                    nmap[f] = new.get(f, mid) # they're the same
                del omap[f]
            elif f in amap:
                if mid != amap[f]:
                    pass # we should prompt here
                else:
                    pass # other deleted it
            else:
                nmap[f] = new.get(f, mid) # we created it

        del mmap

        # whatever is left in omap exists only on the other side
        for f, oid in omap.iteritems():
            if f in amap:
                if oid != amap[f]:
                    pass # this is the nasty case, we should prompt
                else:
                    pass # probably safe
            else:
                nmap[f] = new.get(f, oid) # remote created it

        del omap
        del amap

        node = self.manifest.add(nmap, tr, resolverev, mm, mo)

        # Now all files and manifests are merged, we add the changed files
        # and manifest id to the changelog
        self.ui.status("committing merge changeset\n")
        new = new.keys()
        new.sort()
        # NOTE(review): co == cn already returned above, so this
        # assignment looks unreachable - confirm before removing
        if co == cn: cn = -1

        edittext = "\n"+"".join(["HG: changed %s\n" % f for f in new])
        edittext = self.ui.edit(edittext)
        n = self.changelog.add(node, new, edittext, tr, co, cn)

        tr.close()

    def commit(self, update = None, text = ""):
        """Commit `update` (default: the changed files reported by diffdir).

        Files listed in "to-remove", and files in `update` that cannot be
        read, are dropped from the new manifest.  `text` seeds the commit
        message, which is passed through self.ui.edit.
        """
        tr = self.transaction()

        try:
            fp = self.opener("to-remove")
            try:
                remove = [ l[:-1] for l in fp ]
            finally:
                fp.close()
            os.unlink(self.join("to-remove"))

        except IOError:
            remove = []

        if update is None:
            update = self.diffdir(self.root)[0]

        # check in files
        new = {}
        linkrev = self.changelog.count()
        for f in update:
            try:
                fp = open(f)
                try:
                    t = fp.read()
                finally:
                    fp.close()
            except IOError:
                remove.append(f)
                continue
            r = self.file(f)
            new[f] = r.add(t, tr, linkrev)

        # update manifest
        mmap = self.manifest.read(self.manifest.tip())
        mmap.update(new)
        for f in remove:
            # a name may be queued twice or may never have been committed
            if f in mmap:
                del mmap[f]
        mnode = self.manifest.add(mmap, tr, linkrev)

        # add changeset
        new = new.keys()
        new.sort()

        edittext = text + "\n"+"".join(["HG: changed %s\n" % f for f in new])
        edittext = self.ui.edit(edittext)

        n = self.changelog.add(mnode, new, edittext, tr)
        tr.close()

        self.setcurrent(n)
        self.dircache.update(new)
        self.dircache.remove(remove)

    def checkdir(self, path):
        """Create the missing parent directories of `path`."""
        d = os.path.dirname(path)
        if not d: return
        if not os.path.isdir(d):
            self.checkdir(d)
            os.mkdir(d)

    def checkout(self, node):
        """Write out every file of changeset `node` and make it current."""
        # checkout is really dumb at the moment
        # it ought to basically merge
        change = self.changelog.read(node)
        mmap = self.manifest.read(change[0])

        l = mmap.keys()
        l.sort()
        for f in l:
            r = self.file(f)
            t = r.revision(mmap[f])
            try:
                fp = open(f, "w")
            except IOError:
                # retry once after creating the parent directories
                self.checkdir(f)
                fp = open(f, "w")
            try:
                fp.write(t)
            finally:
                fp.close()

        self.setcurrent(node)
        self.dircache.clear()
        self.dircache.update(l)

    def diffdir(self, path):
        """Compare the working directory with the dircache.

        Returns (changed, added, deleted) lists of file names relative to
        the repository root.  The tree under self.root is walked; `path`
        itself is not used.  File names are stat'ed and opened as given,
        i.e. relative to the process's current directory.
        """
        dc = self.dircache.copy()
        changed = []
        mf = {}
        added = []

        if self.current:
            change = self.changelog.read(self.current)
            mf = self.manifest.read(change[0])

        for dir, subdirs, files in os.walk(self.root):
            d = dir[len(self.root)+1:]
            if ".hg" in subdirs: subdirs.remove(".hg")

            for f in files:
                fn = os.path.join(d, f)
                try: s = os.stat(fn)
                except OSError: continue
                if fn in dc:
                    c = dc[fn]
                    del dc[fn]
                    if c[1] != s.st_size:
                        changed.append(fn)
                    elif c[0] != s.st_mode or c[2] != s.st_mtime:
                        # same size but different mode or mtime: compare
                        # the contents with the committed revision
                        fp = open(fn)
                        try:
                            t1 = fp.read()
                        finally:
                            fp.close()
                        t2 = self.file(fn).revision(mf[fn])
                        if t1 != t2:
                            changed.append(fn)
                else:
                    if self.ignore(fn): continue
                    added.append(fn)

        # entries never seen during the walk no longer exist on disk
        deleted = dc.keys()
        deleted.sort()

        return (changed, added, deleted)

    def add(self, list):
        """Mark the files in `list` as tainted in the dircache."""
        self.dircache.taint(list)

    def remove(self, list):
        """Append the files in `list` to the "to-remove" file."""
        dl = self.opener("to-remove", "a")
        try:
            for f in list:
                dl.write(f + "\n")
        finally:
            dl.close()
523 526
class ui:
    """Minimal user interface: output on stdout, prompts, and an editor."""

    def __init__(self, verbose=False, debug=False):
        """Store the verbosity flags.

        `verbose` enables note(); `debug` enables debug().  The debug flag
        is kept in `debugflag` because the name `debug` is the method.
        """
        self.verbose = verbose
        self.debugflag = debug

    def write(self, *args):
        """Write str() of each argument to sys.stdout."""
        for a in args:
            sys.stdout.write(str(a))

    def prompt(self, msg, pat):
        """Print `msg` and read lines from stdin until one matches `pat`.

        Returns the matching line without its last character.
        """
        # NOTE(review): at end of input readline() returns "", so a `pat`
        # that does not match the empty string looks like it would loop
        # forever - confirm
        while 1:
            sys.stdout.write(msg)
            r = sys.stdin.readline()[:-1]
            if re.match(pat, r):
                return r

    def status(self, *msg):
        """Write the given messages unconditionally."""
        self.write(*msg)

    def warn(self, msg):
        """Write `msg` unconditionally."""
        self.write(msg)

    def note(self, msg):
        """Write `msg` only when verbose."""
        if self.verbose: self.write(msg)

    def debug(self, msg):
        """Write `msg` only when the debug flag was given."""
        if self.debugflag: self.write(msg)

    def edit(self, text):
        """Let the user edit `text` in $EDITOR (default "vi").

        Returns the edited text with every line starting with "HG:"
        removed.  Raises the string exception "Edit failed!" when the
        editor returns a non-zero status.  The temporary file is removed
        in every case.
        """
        # imported locally: this module does not import tempfile by name
        import tempfile

        # note: the positional argument is mkstemp's suffix
        (fd, name) = tempfile.mkstemp("hg")
        try:
            f = os.fdopen(fd, "w")
            try:
                f.write(text)
            finally:
                f.close()

            editor = os.environ.get("EDITOR", "vi")
            r = os.system("%s %s" % (editor, name))
            if r:
                raise "Edit failed!"

            f = open(name)
            try:
                t = f.read()
            finally:
                f.close()
        finally:
            os.unlink(name)

        t = re.sub("(?m)^HG:.*\n", "", t)

        return t
559 562
560 563
class httprangereader:
    """Read-only, seekable view of a URL using HTTP Range requests.

    Every read() issues a fresh request starting at the current position;
    reading does not advance the position.
    """

    def __init__(self, url):
        """Remember `url` and start at position 0."""
        self.url = url
        self.pos = 0

    def seek(self, pos):
        """Set the byte offset at which the next read() starts."""
        self.pos = pos

    def _rangeheader(self, bytes=None):
        """Return the Range header value for reading `bytes` bytes.

        The last-byte position of an HTTP byte range is inclusive, so a
        read of `bytes` bytes from `pos` ends at pos + bytes - 1.  With no
        (or zero) `bytes` the range is open-ended.
        """
        if bytes:
            return 'bytes=%d-%d' % (self.pos, self.pos + bytes - 1)
        return 'bytes=%d-' % self.pos

    def read(self, bytes=None):
        """Fetch and return `bytes` bytes from the current position.

        With no `bytes`, everything from the current position to the end
        is requested.  Installs a urllib2 opener with
        byterange.HTTPRangeHandler as the global opener on every call.
        """
        opener = urllib2.build_opener(byterange.HTTPRangeHandler())
        urllib2.install_opener(opener)
        req = urllib2.Request(self.url)
        req.add_header('Range', self._rangeheader(bytes))
        f = urllib2.urlopen(req)
        try:
            return f.read()
        finally:
            f.close()
General Comments 0
You need to be logged in to leave comments. Login now