##// END OF EJS Templates
parsers.c: remove warning: 'size' may be used uninitialized in this function...
Mads Kiilerich -
r17165:249cc4ec default
parent child Browse files
Show More
@@ -1,1552 +1,1552 b''
1 1 /*
2 2 parsers.c - efficient content parsing
3 3
4 4 Copyright 2008 Matt Mackall <mpm@selenic.com> and others
5 5
6 6 This software may be used and distributed according to the terms of
7 7 the GNU General Public License, incorporated herein by reference.
8 8 */
9 9
10 10 #include <Python.h>
11 11 #include <ctype.h>
12 12 #include <string.h>
13 13
14 14 #include "util.h"
15 15
16 16 static inline int hexdigit(const char *p, Py_ssize_t off)
17 17 {
18 18 char c = p[off];
19 19
20 20 if (c >= '0' && c <= '9')
21 21 return c - '0';
22 22 if (c >= 'a' && c <= 'f')
23 23 return c - 'a' + 10;
24 24 if (c >= 'A' && c <= 'F')
25 25 return c - 'A' + 10;
26 26
27 27 PyErr_SetString(PyExc_ValueError, "input contains non-hex character");
28 28 return 0;
29 29 }
30 30
31 31 /*
32 32 * Turn a hex-encoded string into binary.
33 33 */
34 34 static PyObject *unhexlify(const char *str, int len)
35 35 {
36 36 PyObject *ret;
37 37 char *d;
38 38 int i;
39 39
40 40 ret = PyBytes_FromStringAndSize(NULL, len / 2);
41 41
42 42 if (!ret)
43 43 return NULL;
44 44
45 45 d = PyBytes_AsString(ret);
46 46
47 47 for (i = 0; i < len;) {
48 48 int hi = hexdigit(str, i++);
49 49 int lo = hexdigit(str, i++);
50 50 *d++ = (hi << 4) | lo;
51 51 }
52 52
53 53 return ret;
54 54 }
55 55
56 56 /*
57 57 * This code assumes that a manifest is stitched together with newline
58 58 * ('\n') characters.
59 59 */
60 60 static PyObject *parse_manifest(PyObject *self, PyObject *args)
61 61 {
62 62 PyObject *mfdict, *fdict;
63 63 char *str, *cur, *start, *zero;
64 64 int len;
65 65
66 66 if (!PyArg_ParseTuple(args, "O!O!s#:parse_manifest",
67 67 &PyDict_Type, &mfdict,
68 68 &PyDict_Type, &fdict,
69 69 &str, &len))
70 70 goto quit;
71 71
72 72 for (start = cur = str, zero = NULL; cur < str + len; cur++) {
73 73 PyObject *file = NULL, *node = NULL;
74 74 PyObject *flags = NULL;
75 75 int nlen;
76 76
77 77 if (!*cur) {
78 78 zero = cur;
79 79 continue;
80 80 }
81 81 else if (*cur != '\n')
82 82 continue;
83 83
84 84 if (!zero) {
85 85 PyErr_SetString(PyExc_ValueError,
86 86 "manifest entry has no separator");
87 87 goto quit;
88 88 }
89 89
90 90 file = PyBytes_FromStringAndSize(start, zero - start);
91 91
92 92 if (!file)
93 93 goto bail;
94 94
95 95 nlen = cur - zero - 1;
96 96
97 97 node = unhexlify(zero + 1, nlen > 40 ? 40 : nlen);
98 98 if (!node)
99 99 goto bail;
100 100
101 101 if (nlen > 40) {
102 102 flags = PyBytes_FromStringAndSize(zero + 41,
103 103 nlen - 40);
104 104 if (!flags)
105 105 goto bail;
106 106
107 107 if (PyDict_SetItem(fdict, file, flags) == -1)
108 108 goto bail;
109 109 }
110 110
111 111 if (PyDict_SetItem(mfdict, file, node) == -1)
112 112 goto bail;
113 113
114 114 start = cur + 1;
115 115 zero = NULL;
116 116
117 117 Py_XDECREF(flags);
118 118 Py_XDECREF(node);
119 119 Py_XDECREF(file);
120 120 continue;
121 121 bail:
122 122 Py_XDECREF(flags);
123 123 Py_XDECREF(node);
124 124 Py_XDECREF(file);
125 125 goto quit;
126 126 }
127 127
128 128 if (len > 0 && *(cur - 1) != '\n') {
129 129 PyErr_SetString(PyExc_ValueError,
130 130 "manifest contains trailing garbage");
131 131 goto quit;
132 132 }
133 133
134 134 Py_INCREF(Py_None);
135 135 return Py_None;
136 136 quit:
137 137 return NULL;
138 138 }
139 139
140 140 static PyObject *parse_dirstate(PyObject *self, PyObject *args)
141 141 {
142 142 PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
143 143 PyObject *fname = NULL, *cname = NULL, *entry = NULL;
144 144 char *str, *cur, *end, *cpos;
145 145 int state, mode, size, mtime;
146 146 unsigned int flen;
147 147 int len;
148 148
149 149 if (!PyArg_ParseTuple(args, "O!O!s#:parse_dirstate",
150 150 &PyDict_Type, &dmap,
151 151 &PyDict_Type, &cmap,
152 152 &str, &len))
153 153 goto quit;
154 154
155 155 /* read parents */
156 156 if (len < 40)
157 157 goto quit;
158 158
159 159 parents = Py_BuildValue("s#s#", str, 20, str + 20, 20);
160 160 if (!parents)
161 161 goto quit;
162 162
163 163 /* read filenames */
164 164 cur = str + 40;
165 165 end = str + len;
166 166
167 167 while (cur < end - 17) {
168 168 /* unpack header */
169 169 state = *cur;
170 170 mode = getbe32(cur + 1);
171 171 size = getbe32(cur + 5);
172 172 mtime = getbe32(cur + 9);
173 173 flen = getbe32(cur + 13);
174 174 cur += 17;
175 175 if (cur + flen > end || cur + flen < cur) {
176 176 PyErr_SetString(PyExc_ValueError, "overflow in dirstate");
177 177 goto quit;
178 178 }
179 179
180 180 entry = Py_BuildValue("ciii", state, mode, size, mtime);
181 181 if (!entry)
182 182 goto quit;
183 183 PyObject_GC_UnTrack(entry); /* don't waste time with this */
184 184
185 185 cpos = memchr(cur, 0, flen);
186 186 if (cpos) {
187 187 fname = PyBytes_FromStringAndSize(cur, cpos - cur);
188 188 cname = PyBytes_FromStringAndSize(cpos + 1,
189 189 flen - (cpos - cur) - 1);
190 190 if (!fname || !cname ||
191 191 PyDict_SetItem(cmap, fname, cname) == -1 ||
192 192 PyDict_SetItem(dmap, fname, entry) == -1)
193 193 goto quit;
194 194 Py_DECREF(cname);
195 195 } else {
196 196 fname = PyBytes_FromStringAndSize(cur, flen);
197 197 if (!fname ||
198 198 PyDict_SetItem(dmap, fname, entry) == -1)
199 199 goto quit;
200 200 }
201 201 cur += flen;
202 202 Py_DECREF(fname);
203 203 Py_DECREF(entry);
204 204 fname = cname = entry = NULL;
205 205 }
206 206
207 207 ret = parents;
208 208 Py_INCREF(ret);
209 209 quit:
210 210 Py_XDECREF(fname);
211 211 Py_XDECREF(cname);
212 212 Py_XDECREF(entry);
213 213 Py_XDECREF(parents);
214 214 return ret;
215 215 }
216 216
217 217 static inline int getintat(PyObject *tuple, int off, uint32_t *v)
218 218 {
219 219 PyObject *o = PyTuple_GET_ITEM(tuple, off);
220 220 long val;
221 221
222 222 if (PyInt_Check(o))
223 223 val = PyInt_AS_LONG(o);
224 224 else if (PyLong_Check(o)) {
225 225 val = PyLong_AsLong(o);
226 226 if (val == -1 && PyErr_Occurred())
227 227 return -1;
228 228 } else {
229 229 PyErr_SetString(PyExc_TypeError, "expected an int or long");
230 230 return -1;
231 231 }
232 232 if (LONG_MAX > INT_MAX && (val > INT_MAX || val < INT_MIN)) {
233 233 PyErr_SetString(PyExc_OverflowError,
234 234 "Python value to large to convert to uint32_t");
235 235 return -1;
236 236 }
237 237 *v = (uint32_t)val;
238 238 return 0;
239 239 }
240 240
241 241 static PyObject *dirstate_unset;
242 242
243 243 /*
244 244 * Efficiently pack a dirstate object into its on-disk format.
245 245 */
246 246 static PyObject *pack_dirstate(PyObject *self, PyObject *args)
247 247 {
248 248 PyObject *packobj = NULL;
249 249 PyObject *map, *copymap, *pl;
250 250 Py_ssize_t nbytes, pos, l;
251 251 PyObject *k, *v, *pn;
252 252 char *p, *s;
253 253 double now;
254 254
255 255 if (!PyArg_ParseTuple(args, "O!O!Od:pack_dirstate",
256 256 &PyDict_Type, &map, &PyDict_Type, &copymap,
257 257 &pl, &now))
258 258 return NULL;
259 259
260 260 if (!PySequence_Check(pl) || PySequence_Size(pl) != 2) {
261 261 PyErr_SetString(PyExc_TypeError, "expected 2-element sequence");
262 262 return NULL;
263 263 }
264 264
265 265 /* Figure out how much we need to allocate. */
266 266 for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
267 267 PyObject *c;
268 268 if (!PyString_Check(k)) {
269 269 PyErr_SetString(PyExc_TypeError, "expected string key");
270 270 goto bail;
271 271 }
272 272 nbytes += PyString_GET_SIZE(k) + 17;
273 273 c = PyDict_GetItem(copymap, k);
274 274 if (c) {
275 275 if (!PyString_Check(c)) {
276 276 PyErr_SetString(PyExc_TypeError,
277 277 "expected string key");
278 278 goto bail;
279 279 }
280 280 nbytes += PyString_GET_SIZE(c) + 1;
281 281 }
282 282 }
283 283
284 284 packobj = PyString_FromStringAndSize(NULL, nbytes);
285 285 if (packobj == NULL)
286 286 goto bail;
287 287
288 288 p = PyString_AS_STRING(packobj);
289 289
290 290 pn = PySequence_ITEM(pl, 0);
291 291 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
292 292 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
293 293 goto bail;
294 294 }
295 295 memcpy(p, s, l);
296 296 p += 20;
297 297 pn = PySequence_ITEM(pl, 1);
298 298 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
299 299 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
300 300 goto bail;
301 301 }
302 302 memcpy(p, s, l);
303 303 p += 20;
304 304
305 305 for (pos = 0; PyDict_Next(map, &pos, &k, &v); ) {
306 306 uint32_t mode, size, mtime;
307 307 Py_ssize_t len, l;
308 308 PyObject *o;
309 309 char *s, *t;
310 int err;
311 310
312 311 if (!PyTuple_Check(v) || PyTuple_GET_SIZE(v) != 4) {
313 312 PyErr_SetString(PyExc_TypeError, "expected a 4-tuple");
314 313 goto bail;
315 314 }
316 315 o = PyTuple_GET_ITEM(v, 0);
317 316 if (PyString_AsStringAndSize(o, &s, &l) == -1 || l != 1) {
318 317 PyErr_SetString(PyExc_TypeError, "expected one byte");
319 318 goto bail;
320 319 }
321 320 *p++ = *s;
322 err = getintat(v, 1, &mode);
323 err |= getintat(v, 2, &size);
324 err |= getintat(v, 3, &mtime);
325 if (err)
321 if (getintat(v, 1, &mode) == -1)
322 goto bail;
323 if (getintat(v, 2, &size) == -1)
324 goto bail;
325 if (getintat(v, 3, &mtime) == -1)
326 326 goto bail;
327 327 if (*s == 'n' && mtime == (uint32_t)now) {
328 328 /* See dirstate.py:write for why we do this. */
329 329 if (PyDict_SetItem(map, k, dirstate_unset) == -1)
330 330 goto bail;
331 331 mode = 0, size = -1, mtime = -1;
332 332 }
333 333 putbe32(mode, p);
334 334 putbe32(size, p + 4);
335 335 putbe32(mtime, p + 8);
336 336 t = p + 12;
337 337 p += 16;
338 338 len = PyString_GET_SIZE(k);
339 339 memcpy(p, PyString_AS_STRING(k), len);
340 340 p += len;
341 341 o = PyDict_GetItem(copymap, k);
342 342 if (o) {
343 343 *p++ = '\0';
344 344 l = PyString_GET_SIZE(o);
345 345 memcpy(p, PyString_AS_STRING(o), l);
346 346 p += l;
347 347 len += l + 1;
348 348 }
349 349 putbe32((uint32_t)len, t);
350 350 }
351 351
352 352 pos = p - PyString_AS_STRING(packobj);
353 353 if (pos != nbytes) {
354 354 PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
355 355 (long)pos, (long)nbytes);
356 356 goto bail;
357 357 }
358 358
359 359 return packobj;
360 360 bail:
361 361 Py_XDECREF(packobj);
362 362 return NULL;
363 363 }
364 364
/*
 * One node of the base-16 trie used for fast node->rev mapping.
 *
 * Every slot of children[] is interpreted by its sign:
 *
 *   positive: index of the next node in the trie
 *   negative: a leaf, encoded as -(rev + 1)
 *   zero:     empty
 */
typedef struct {
	int children[16];
} nodetree;
375 375
376 376 /*
377 377 * This class has two behaviours.
378 378 *
379 379 * When used in a list-like way (with integer keys), we decode an
380 380 * entry in a RevlogNG index file on demand. Our last entry is a
381 381 * sentinel, always a nullid. We have limited support for
382 382 * integer-keyed insert and delete, only at elements right before the
383 383 * sentinel.
384 384 *
385 385 * With string keys, we lazily perform a reverse mapping from node to
386 386 * rev, using a base-16 trie.
387 387 */
388 388 typedef struct {
389 389 PyObject_HEAD
390 390 /* Type-specific fields go here. */
391 391 PyObject *data; /* raw bytes of index */
392 392 PyObject **cache; /* cached tuples */
393 393 const char **offsets; /* populated on demand */
394 394 Py_ssize_t raw_length; /* original number of elements */
395 395 Py_ssize_t length; /* current number of elements */
396 396 PyObject *added; /* populated on demand */
397 397 PyObject *headrevs; /* cache, invalidated on changes */
398 398 nodetree *nt; /* base-16 trie */
399 399 int ntlength; /* # nodes in use */
400 400 int ntcapacity; /* # nodes allocated */
401 401 int ntdepth; /* maximum depth of tree */
402 402 int ntsplits; /* # splits performed */
403 403 int ntrev; /* last rev scanned */
404 404 int ntlookups; /* # lookups */
405 405 int ntmisses; /* # lookups that miss the cache */
406 406 int inlined;
407 407 } indexObject;
408 408
409 409 static Py_ssize_t index_length(const indexObject *self)
410 410 {
411 411 if (self->added == NULL)
412 412 return self->length;
413 413 return self->length + PyList_GET_SIZE(self->added);
414 414 }
415 415
416 416 static PyObject *nullentry;
417 417 static const char nullid[20];
418 418
419 419 static long inline_scan(indexObject *self, const char **offsets);
420 420
421 421 #if LONG_MAX == 0x7fffffffL
422 422 static char *tuple_format = "Kiiiiiis#";
423 423 #else
424 424 static char *tuple_format = "kiiiiiis#";
425 425 #endif
426 426
427 427 /* A RevlogNG v1 index entry is 64 bytes long. */
428 428 static const long v1_hdrsize = 64;
429 429
430 430 /*
431 431 * Return a pointer to the beginning of a RevlogNG record.
432 432 */
433 433 static const char *index_deref(indexObject *self, Py_ssize_t pos)
434 434 {
435 435 if (self->inlined && pos > 0) {
436 436 if (self->offsets == NULL) {
437 437 self->offsets = malloc(self->raw_length *
438 438 sizeof(*self->offsets));
439 439 if (self->offsets == NULL)
440 440 return (const char *)PyErr_NoMemory();
441 441 inline_scan(self, self->offsets);
442 442 }
443 443 return self->offsets[pos];
444 444 }
445 445
446 446 return PyString_AS_STRING(self->data) + pos * v1_hdrsize;
447 447 }
448 448
449 449 /*
450 450 * RevlogNG format (all in big endian, data may be inlined):
451 451 * 6 bytes: offset
452 452 * 2 bytes: flags
453 453 * 4 bytes: compressed length
454 454 * 4 bytes: uncompressed length
455 455 * 4 bytes: base revision
456 456 * 4 bytes: link revision
457 457 * 4 bytes: parent 1 revision
458 458 * 4 bytes: parent 2 revision
459 459 * 32 bytes: nodeid (only 20 bytes used)
460 460 */
461 461 static PyObject *index_get(indexObject *self, Py_ssize_t pos)
462 462 {
463 463 uint64_t offset_flags;
464 464 int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
465 465 const char *c_node_id;
466 466 const char *data;
467 467 Py_ssize_t length = index_length(self);
468 468 PyObject *entry;
469 469
470 470 if (pos < 0)
471 471 pos += length;
472 472
473 473 if (pos < 0 || pos >= length) {
474 474 PyErr_SetString(PyExc_IndexError, "revlog index out of range");
475 475 return NULL;
476 476 }
477 477
478 478 if (pos == length - 1) {
479 479 Py_INCREF(nullentry);
480 480 return nullentry;
481 481 }
482 482
483 483 if (pos >= self->length - 1) {
484 484 PyObject *obj;
485 485 obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
486 486 Py_INCREF(obj);
487 487 return obj;
488 488 }
489 489
490 490 if (self->cache) {
491 491 if (self->cache[pos]) {
492 492 Py_INCREF(self->cache[pos]);
493 493 return self->cache[pos];
494 494 }
495 495 } else {
496 496 self->cache = calloc(self->raw_length, sizeof(PyObject *));
497 497 if (self->cache == NULL)
498 498 return PyErr_NoMemory();
499 499 }
500 500
501 501 data = index_deref(self, pos);
502 502 if (data == NULL)
503 503 return NULL;
504 504
505 505 offset_flags = getbe32(data + 4);
506 506 if (pos == 0) /* mask out version number for the first entry */
507 507 offset_flags &= 0xFFFF;
508 508 else {
509 509 uint32_t offset_high = getbe32(data);
510 510 offset_flags |= ((uint64_t)offset_high) << 32;
511 511 }
512 512
513 513 comp_len = getbe32(data + 8);
514 514 uncomp_len = getbe32(data + 12);
515 515 base_rev = getbe32(data + 16);
516 516 link_rev = getbe32(data + 20);
517 517 parent_1 = getbe32(data + 24);
518 518 parent_2 = getbe32(data + 28);
519 519 c_node_id = data + 32;
520 520
521 521 entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
522 522 uncomp_len, base_rev, link_rev,
523 523 parent_1, parent_2, c_node_id, 20);
524 524
525 525 if (entry)
526 526 PyObject_GC_UnTrack(entry);
527 527
528 528 self->cache[pos] = entry;
529 529 Py_INCREF(entry);
530 530
531 531 return entry;
532 532 }
533 533
534 534 /*
535 535 * Return the 20-byte SHA of the node corresponding to the given rev.
536 536 */
537 537 static const char *index_node(indexObject *self, Py_ssize_t pos)
538 538 {
539 539 Py_ssize_t length = index_length(self);
540 540 const char *data;
541 541
542 542 if (pos == length - 1 || pos == INT_MAX)
543 543 return nullid;
544 544
545 545 if (pos >= length)
546 546 return NULL;
547 547
548 548 if (pos >= self->length - 1) {
549 549 PyObject *tuple, *str;
550 550 tuple = PyList_GET_ITEM(self->added, pos - self->length + 1);
551 551 str = PyTuple_GetItem(tuple, 7);
552 552 return str ? PyString_AS_STRING(str) : NULL;
553 553 }
554 554
555 555 data = index_deref(self, pos);
556 556 return data ? data + 32 : NULL;
557 557 }
558 558
559 559 static int nt_insert(indexObject *self, const char *node, int rev);
560 560
561 561 static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
562 562 {
563 563 if (PyString_AsStringAndSize(obj, node, nodelen) == -1)
564 564 return -1;
565 565 if (*nodelen == 20)
566 566 return 0;
567 567 PyErr_SetString(PyExc_ValueError, "20-byte hash required");
568 568 return -1;
569 569 }
570 570
571 571 static PyObject *index_insert(indexObject *self, PyObject *args)
572 572 {
573 573 PyObject *obj;
574 574 char *node;
575 575 long offset;
576 576 Py_ssize_t len, nodelen;
577 577
578 578 if (!PyArg_ParseTuple(args, "lO", &offset, &obj))
579 579 return NULL;
580 580
581 581 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 8) {
582 582 PyErr_SetString(PyExc_TypeError, "8-tuple required");
583 583 return NULL;
584 584 }
585 585
586 586 if (node_check(PyTuple_GET_ITEM(obj, 7), &node, &nodelen) == -1)
587 587 return NULL;
588 588
589 589 len = index_length(self);
590 590
591 591 if (offset < 0)
592 592 offset += len;
593 593
594 594 if (offset != len - 1) {
595 595 PyErr_SetString(PyExc_IndexError,
596 596 "insert only supported at index -1");
597 597 return NULL;
598 598 }
599 599
600 600 if (offset > INT_MAX) {
601 601 PyErr_SetString(PyExc_ValueError,
602 602 "currently only 2**31 revs supported");
603 603 return NULL;
604 604 }
605 605
606 606 if (self->added == NULL) {
607 607 self->added = PyList_New(0);
608 608 if (self->added == NULL)
609 609 return NULL;
610 610 }
611 611
612 612 if (PyList_Append(self->added, obj) == -1)
613 613 return NULL;
614 614
615 615 if (self->nt)
616 616 nt_insert(self, node, (int)offset);
617 617
618 618 Py_CLEAR(self->headrevs);
619 619 Py_RETURN_NONE;
620 620 }
621 621
622 622 static void _index_clearcaches(indexObject *self)
623 623 {
624 624 if (self->cache) {
625 625 Py_ssize_t i;
626 626
627 627 for (i = 0; i < self->raw_length; i++)
628 628 Py_CLEAR(self->cache[i]);
629 629 free(self->cache);
630 630 self->cache = NULL;
631 631 }
632 632 if (self->offsets) {
633 633 free(self->offsets);
634 634 self->offsets = NULL;
635 635 }
636 636 if (self->nt) {
637 637 free(self->nt);
638 638 self->nt = NULL;
639 639 }
640 640 Py_CLEAR(self->headrevs);
641 641 }
642 642
643 643 static PyObject *index_clearcaches(indexObject *self)
644 644 {
645 645 _index_clearcaches(self);
646 646 self->ntlength = self->ntcapacity = 0;
647 647 self->ntdepth = self->ntsplits = 0;
648 648 self->ntrev = -1;
649 649 self->ntlookups = self->ntmisses = 0;
650 650 Py_RETURN_NONE;
651 651 }
652 652
653 653 static PyObject *index_stats(indexObject *self)
654 654 {
655 655 PyObject *obj = PyDict_New();
656 656
657 657 if (obj == NULL)
658 658 return NULL;
659 659
660 660 #define istat(__n, __d) \
661 661 if (PyDict_SetItemString(obj, __d, PyInt_FromSsize_t(self->__n)) == -1) \
662 662 goto bail;
663 663
664 664 if (self->added) {
665 665 Py_ssize_t len = PyList_GET_SIZE(self->added);
666 666 if (PyDict_SetItemString(obj, "index entries added",
667 667 PyInt_FromSsize_t(len)) == -1)
668 668 goto bail;
669 669 }
670 670
671 671 if (self->raw_length != self->length - 1)
672 672 istat(raw_length, "revs on disk");
673 673 istat(length, "revs in memory");
674 674 istat(ntcapacity, "node trie capacity");
675 675 istat(ntdepth, "node trie depth");
676 676 istat(ntlength, "node trie count");
677 677 istat(ntlookups, "node trie lookups");
678 678 istat(ntmisses, "node trie misses");
679 679 istat(ntrev, "node trie last rev scanned");
680 680 istat(ntsplits, "node trie splits");
681 681
682 682 #undef istat
683 683
684 684 return obj;
685 685
686 686 bail:
687 687 Py_XDECREF(obj);
688 688 return NULL;
689 689 }
690 690
691 691 /*
692 692 * When we cache a list, we want to be sure the caller can't mutate
693 693 * the cached copy.
694 694 */
695 695 static PyObject *list_copy(PyObject *list)
696 696 {
697 697 Py_ssize_t len = PyList_GET_SIZE(list);
698 698 PyObject *newlist = PyList_New(len);
699 699 Py_ssize_t i;
700 700
701 701 if (newlist == NULL)
702 702 return NULL;
703 703
704 704 for (i = 0; i < len; i++) {
705 705 PyObject *obj = PyList_GET_ITEM(list, i);
706 706 Py_INCREF(obj);
707 707 PyList_SET_ITEM(newlist, i, obj);
708 708 }
709 709
710 710 return newlist;
711 711 }
712 712
713 713 static PyObject *index_headrevs(indexObject *self)
714 714 {
715 715 Py_ssize_t i, len, addlen;
716 716 char *nothead = NULL;
717 717 PyObject *heads;
718 718
719 719 if (self->headrevs)
720 720 return list_copy(self->headrevs);
721 721
722 722 len = index_length(self) - 1;
723 723 heads = PyList_New(0);
724 724 if (heads == NULL)
725 725 goto bail;
726 726 if (len == 0) {
727 727 PyObject *nullid = PyInt_FromLong(-1);
728 728 if (nullid == NULL || PyList_Append(heads, nullid) == -1) {
729 729 Py_XDECREF(nullid);
730 730 goto bail;
731 731 }
732 732 goto done;
733 733 }
734 734
735 735 nothead = calloc(len, 1);
736 736 if (nothead == NULL)
737 737 goto bail;
738 738
739 739 for (i = 0; i < self->raw_length; i++) {
740 740 const char *data = index_deref(self, i);
741 741 int parent_1 = getbe32(data + 24);
742 742 int parent_2 = getbe32(data + 28);
743 743 if (parent_1 >= 0)
744 744 nothead[parent_1] = 1;
745 745 if (parent_2 >= 0)
746 746 nothead[parent_2] = 1;
747 747 }
748 748
749 749 addlen = self->added ? PyList_GET_SIZE(self->added) : 0;
750 750
751 751 for (i = 0; i < addlen; i++) {
752 752 PyObject *rev = PyList_GET_ITEM(self->added, i);
753 753 PyObject *p1 = PyTuple_GET_ITEM(rev, 5);
754 754 PyObject *p2 = PyTuple_GET_ITEM(rev, 6);
755 755 long parent_1, parent_2;
756 756
757 757 if (!PyInt_Check(p1) || !PyInt_Check(p2)) {
758 758 PyErr_SetString(PyExc_TypeError,
759 759 "revlog parents are invalid");
760 760 goto bail;
761 761 }
762 762 parent_1 = PyInt_AS_LONG(p1);
763 763 parent_2 = PyInt_AS_LONG(p2);
764 764 if (parent_1 >= 0)
765 765 nothead[parent_1] = 1;
766 766 if (parent_2 >= 0)
767 767 nothead[parent_2] = 1;
768 768 }
769 769
770 770 for (i = 0; i < len; i++) {
771 771 PyObject *head;
772 772
773 773 if (nothead[i])
774 774 continue;
775 775 head = PyInt_FromLong(i);
776 776 if (head == NULL || PyList_Append(heads, head) == -1) {
777 777 Py_XDECREF(head);
778 778 goto bail;
779 779 }
780 780 }
781 781
782 782 done:
783 783 self->headrevs = heads;
784 784 free(nothead);
785 785 return list_copy(self->headrevs);
786 786 bail:
787 787 Py_XDECREF(heads);
788 788 free(nothead);
789 789 return NULL;
790 790 }
791 791
792 792 static inline int nt_level(const char *node, Py_ssize_t level)
793 793 {
794 794 int v = node[level>>1];
795 795 if (!(level & 1))
796 796 v >>= 4;
797 797 return v & 0xf;
798 798 }
799 799
800 800 /*
801 801 * Return values:
802 802 *
803 803 * -4: match is ambiguous (multiple candidates)
804 804 * -2: not found
805 805 * rest: valid rev
806 806 */
807 807 static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
808 808 int hex)
809 809 {
810 810 int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
811 811 int level, maxlevel, off;
812 812
813 813 if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
814 814 return -1;
815 815
816 816 if (self->nt == NULL)
817 817 return -2;
818 818
819 819 if (hex)
820 820 maxlevel = nodelen > 40 ? 40 : (int)nodelen;
821 821 else
822 822 maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
823 823
824 824 for (level = off = 0; level < maxlevel; level++) {
825 825 int k = getnybble(node, level);
826 826 nodetree *n = &self->nt[off];
827 827 int v = n->children[k];
828 828
829 829 if (v < 0) {
830 830 const char *n;
831 831 Py_ssize_t i;
832 832
833 833 v = -v - 1;
834 834 n = index_node(self, v);
835 835 if (n == NULL)
836 836 return -2;
837 837 for (i = level; i < maxlevel; i++)
838 838 if (getnybble(node, i) != nt_level(n, i))
839 839 return -2;
840 840 return v;
841 841 }
842 842 if (v == 0)
843 843 return -2;
844 844 off = v;
845 845 }
846 846 /* multiple matches against an ambiguous prefix */
847 847 return -4;
848 848 }
849 849
850 850 static int nt_new(indexObject *self)
851 851 {
852 852 if (self->ntlength == self->ntcapacity) {
853 853 self->ntcapacity *= 2;
854 854 self->nt = realloc(self->nt,
855 855 self->ntcapacity * sizeof(nodetree));
856 856 if (self->nt == NULL) {
857 857 PyErr_SetString(PyExc_MemoryError, "out of memory");
858 858 return -1;
859 859 }
860 860 memset(&self->nt[self->ntlength], 0,
861 861 sizeof(nodetree) * (self->ntcapacity - self->ntlength));
862 862 }
863 863 return self->ntlength++;
864 864 }
865 865
866 866 static int nt_insert(indexObject *self, const char *node, int rev)
867 867 {
868 868 int level = 0;
869 869 int off = 0;
870 870
871 871 while (level < 40) {
872 872 int k = nt_level(node, level);
873 873 nodetree *n;
874 874 int v;
875 875
876 876 n = &self->nt[off];
877 877 v = n->children[k];
878 878
879 879 if (v == 0) {
880 880 n->children[k] = -rev - 1;
881 881 return 0;
882 882 }
883 883 if (v < 0) {
884 884 const char *oldnode = index_node(self, -v - 1);
885 885 int noff;
886 886
887 887 if (!oldnode || !memcmp(oldnode, node, 20)) {
888 888 n->children[k] = -rev - 1;
889 889 return 0;
890 890 }
891 891 noff = nt_new(self);
892 892 if (noff == -1)
893 893 return -1;
894 894 /* self->nt may have been changed by realloc */
895 895 self->nt[off].children[k] = noff;
896 896 off = noff;
897 897 n = &self->nt[off];
898 898 n->children[nt_level(oldnode, ++level)] = v;
899 899 if (level > self->ntdepth)
900 900 self->ntdepth = level;
901 901 self->ntsplits += 1;
902 902 } else {
903 903 level += 1;
904 904 off = v;
905 905 }
906 906 }
907 907
908 908 return -1;
909 909 }
910 910
911 911 static int nt_init(indexObject *self)
912 912 {
913 913 if (self->nt == NULL) {
914 914 self->ntcapacity = self->raw_length < 4
915 915 ? 4 : self->raw_length / 2;
916 916 self->nt = calloc(self->ntcapacity, sizeof(nodetree));
917 917 if (self->nt == NULL) {
918 918 PyErr_NoMemory();
919 919 return -1;
920 920 }
921 921 self->ntlength = 1;
922 922 self->ntrev = (int)index_length(self) - 1;
923 923 self->ntlookups = 1;
924 924 self->ntmisses = 0;
925 925 if (nt_insert(self, nullid, INT_MAX) == -1)
926 926 return -1;
927 927 }
928 928 return 0;
929 929 }
930 930
931 931 /*
932 932 * Return values:
933 933 *
934 934 * -3: error (exception set)
935 935 * -2: not found (no exception set)
936 936 * rest: valid rev
937 937 */
938 938 static int index_find_node(indexObject *self,
939 939 const char *node, Py_ssize_t nodelen)
940 940 {
941 941 int rev;
942 942
943 943 self->ntlookups++;
944 944 rev = nt_find(self, node, nodelen, 0);
945 945 if (rev >= -1)
946 946 return rev;
947 947
948 948 if (nt_init(self) == -1)
949 949 return -3;
950 950
951 951 /*
952 952 * For the first handful of lookups, we scan the entire index,
953 953 * and cache only the matching nodes. This optimizes for cases
954 954 * like "hg tip", where only a few nodes are accessed.
955 955 *
956 956 * After that, we cache every node we visit, using a single
957 957 * scan amortized over multiple lookups. This gives the best
958 958 * bulk performance, e.g. for "hg log".
959 959 */
960 960 if (self->ntmisses++ < 4) {
961 961 for (rev = self->ntrev - 1; rev >= 0; rev--) {
962 962 const char *n = index_node(self, rev);
963 963 if (n == NULL)
964 964 return -2;
965 965 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
966 966 if (nt_insert(self, n, rev) == -1)
967 967 return -3;
968 968 break;
969 969 }
970 970 }
971 971 } else {
972 972 for (rev = self->ntrev - 1; rev >= 0; rev--) {
973 973 const char *n = index_node(self, rev);
974 974 if (n == NULL) {
975 975 self->ntrev = rev + 1;
976 976 return -2;
977 977 }
978 978 if (nt_insert(self, n, rev) == -1) {
979 979 self->ntrev = rev + 1;
980 980 return -3;
981 981 }
982 982 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
983 983 break;
984 984 }
985 985 }
986 986 self->ntrev = rev;
987 987 }
988 988
989 989 if (rev >= 0)
990 990 return rev;
991 991 return -2;
992 992 }
993 993
994 994 static PyObject *raise_revlog_error(void)
995 995 {
996 996 static PyObject *errclass;
997 997 PyObject *mod = NULL, *errobj;
998 998
999 999 if (errclass == NULL) {
1000 1000 PyObject *dict;
1001 1001
1002 1002 mod = PyImport_ImportModule("mercurial.error");
1003 1003 if (mod == NULL)
1004 1004 goto classfail;
1005 1005
1006 1006 dict = PyModule_GetDict(mod);
1007 1007 if (dict == NULL)
1008 1008 goto classfail;
1009 1009
1010 1010 errclass = PyDict_GetItemString(dict, "RevlogError");
1011 1011 if (errclass == NULL) {
1012 1012 PyErr_SetString(PyExc_SystemError,
1013 1013 "could not find RevlogError");
1014 1014 goto classfail;
1015 1015 }
1016 1016 Py_INCREF(errclass);
1017 1017 }
1018 1018
1019 1019 errobj = PyObject_CallFunction(errclass, NULL);
1020 1020 if (errobj == NULL)
1021 1021 return NULL;
1022 1022 PyErr_SetObject(errclass, errobj);
1023 1023 return errobj;
1024 1024
1025 1025 classfail:
1026 1026 Py_XDECREF(mod);
1027 1027 return NULL;
1028 1028 }
1029 1029
1030 1030 static PyObject *index_getitem(indexObject *self, PyObject *value)
1031 1031 {
1032 1032 char *node;
1033 1033 Py_ssize_t nodelen;
1034 1034 int rev;
1035 1035
1036 1036 if (PyInt_Check(value))
1037 1037 return index_get(self, PyInt_AS_LONG(value));
1038 1038
1039 1039 if (node_check(value, &node, &nodelen) == -1)
1040 1040 return NULL;
1041 1041 rev = index_find_node(self, node, nodelen);
1042 1042 if (rev >= -1)
1043 1043 return PyInt_FromLong(rev);
1044 1044 if (rev == -2)
1045 1045 raise_revlog_error();
1046 1046 return NULL;
1047 1047 }
1048 1048
1049 1049 static int nt_partialmatch(indexObject *self, const char *node,
1050 1050 Py_ssize_t nodelen)
1051 1051 {
1052 1052 int rev;
1053 1053
1054 1054 if (nt_init(self) == -1)
1055 1055 return -3;
1056 1056
1057 1057 if (self->ntrev > 0) {
1058 1058 /* ensure that the radix tree is fully populated */
1059 1059 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1060 1060 const char *n = index_node(self, rev);
1061 1061 if (n == NULL)
1062 1062 return -2;
1063 1063 if (nt_insert(self, n, rev) == -1)
1064 1064 return -3;
1065 1065 }
1066 1066 self->ntrev = rev;
1067 1067 }
1068 1068
1069 1069 return nt_find(self, node, nodelen, 1);
1070 1070 }
1071 1071
1072 1072 static PyObject *index_partialmatch(indexObject *self, PyObject *args)
1073 1073 {
1074 1074 const char *fullnode;
1075 1075 int nodelen;
1076 1076 char *node;
1077 1077 int rev, i;
1078 1078
1079 1079 if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
1080 1080 return NULL;
1081 1081
1082 1082 if (nodelen < 4) {
1083 1083 PyErr_SetString(PyExc_ValueError, "key too short");
1084 1084 return NULL;
1085 1085 }
1086 1086
1087 1087 if (nodelen > 40)
1088 1088 nodelen = 40;
1089 1089
1090 1090 for (i = 0; i < nodelen; i++)
1091 1091 hexdigit(node, i);
1092 1092 if (PyErr_Occurred()) {
1093 1093 /* input contains non-hex characters */
1094 1094 PyErr_Clear();
1095 1095 Py_RETURN_NONE;
1096 1096 }
1097 1097
1098 1098 rev = nt_partialmatch(self, node, nodelen);
1099 1099
1100 1100 switch (rev) {
1101 1101 case -4:
1102 1102 raise_revlog_error();
1103 1103 case -3:
1104 1104 return NULL;
1105 1105 case -2:
1106 1106 Py_RETURN_NONE;
1107 1107 case -1:
1108 1108 return PyString_FromStringAndSize(nullid, 20);
1109 1109 }
1110 1110
1111 1111 fullnode = index_node(self, rev);
1112 1112 if (fullnode == NULL) {
1113 1113 PyErr_Format(PyExc_IndexError,
1114 1114 "could not access rev %d", rev);
1115 1115 return NULL;
1116 1116 }
1117 1117 return PyString_FromStringAndSize(fullnode, 20);
1118 1118 }
1119 1119
1120 1120 static PyObject *index_m_get(indexObject *self, PyObject *args)
1121 1121 {
1122 1122 Py_ssize_t nodelen;
1123 1123 PyObject *val;
1124 1124 char *node;
1125 1125 int rev;
1126 1126
1127 1127 if (!PyArg_ParseTuple(args, "O", &val))
1128 1128 return NULL;
1129 1129 if (node_check(val, &node, &nodelen) == -1)
1130 1130 return NULL;
1131 1131 rev = index_find_node(self, node, nodelen);
1132 1132 if (rev == -3)
1133 1133 return NULL;
1134 1134 if (rev == -2)
1135 1135 Py_RETURN_NONE;
1136 1136 return PyInt_FromLong(rev);
1137 1137 }
1138 1138
1139 1139 static int index_contains(indexObject *self, PyObject *value)
1140 1140 {
1141 1141 char *node;
1142 1142 Py_ssize_t nodelen;
1143 1143
1144 1144 if (PyInt_Check(value)) {
1145 1145 long rev = PyInt_AS_LONG(value);
1146 1146 return rev >= -1 && rev < index_length(self);
1147 1147 }
1148 1148
1149 1149 if (node_check(value, &node, &nodelen) == -1)
1150 1150 return -1;
1151 1151
1152 1152 switch (index_find_node(self, node, nodelen)) {
1153 1153 case -3:
1154 1154 return -1;
1155 1155 case -2:
1156 1156 return 0;
1157 1157 default:
1158 1158 return 1;
1159 1159 }
1160 1160 }
1161 1161
1162 1162 /*
1163 1163 * Invalidate any trie entries introduced by added revs.
1164 1164 */
1165 1165 static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
1166 1166 {
1167 1167 Py_ssize_t i, len = PyList_GET_SIZE(self->added);
1168 1168
1169 1169 for (i = start; i < len; i++) {
1170 1170 PyObject *tuple = PyList_GET_ITEM(self->added, i);
1171 1171 PyObject *node = PyTuple_GET_ITEM(tuple, 7);
1172 1172
1173 1173 nt_insert(self, PyString_AS_STRING(node), -1);
1174 1174 }
1175 1175
1176 1176 if (start == 0)
1177 1177 Py_CLEAR(self->added);
1178 1178 }
1179 1179
1180 1180 /*
1181 1181 * Delete a numeric range of revs, which must be at the end of the
1182 1182 * range, but exclude the sentinel nullid entry.
1183 1183 */
1184 1184 static int index_slice_del(indexObject *self, PyObject *item)
1185 1185 {
1186 1186 Py_ssize_t start, stop, step, slicelength;
1187 1187 Py_ssize_t length = index_length(self);
1188 1188 int ret = 0;
1189 1189
1190 1190 if (PySlice_GetIndicesEx((PySliceObject*)item, length,
1191 1191 &start, &stop, &step, &slicelength) < 0)
1192 1192 return -1;
1193 1193
1194 1194 if (slicelength <= 0)
1195 1195 return 0;
1196 1196
1197 1197 if ((step < 0 && start < stop) || (step > 0 && start > stop))
1198 1198 stop = start;
1199 1199
1200 1200 if (step < 0) {
1201 1201 stop = start + 1;
1202 1202 start = stop + step*(slicelength - 1) - 1;
1203 1203 step = -step;
1204 1204 }
1205 1205
1206 1206 if (step != 1) {
1207 1207 PyErr_SetString(PyExc_ValueError,
1208 1208 "revlog index delete requires step size of 1");
1209 1209 return -1;
1210 1210 }
1211 1211
1212 1212 if (stop != length - 1) {
1213 1213 PyErr_SetString(PyExc_IndexError,
1214 1214 "revlog index deletion indices are invalid");
1215 1215 return -1;
1216 1216 }
1217 1217
1218 1218 if (start < self->length - 1) {
1219 1219 if (self->nt) {
1220 1220 Py_ssize_t i;
1221 1221
1222 1222 for (i = start + 1; i < self->length - 1; i++) {
1223 1223 const char *node = index_node(self, i);
1224 1224
1225 1225 if (node)
1226 1226 nt_insert(self, node, -1);
1227 1227 }
1228 1228 if (self->added)
1229 1229 nt_invalidate_added(self, 0);
1230 1230 if (self->ntrev > start)
1231 1231 self->ntrev = (int)start;
1232 1232 }
1233 1233 self->length = start + 1;
1234 1234 if (start < self->raw_length)
1235 1235 self->raw_length = start;
1236 1236 goto done;
1237 1237 }
1238 1238
1239 1239 if (self->nt) {
1240 1240 nt_invalidate_added(self, start - self->length + 1);
1241 1241 if (self->ntrev > start)
1242 1242 self->ntrev = (int)start;
1243 1243 }
1244 1244 if (self->added)
1245 1245 ret = PyList_SetSlice(self->added, start - self->length + 1,
1246 1246 PyList_GET_SIZE(self->added), NULL);
1247 1247 done:
1248 1248 Py_CLEAR(self->headrevs);
1249 1249 return ret;
1250 1250 }
1251 1251
1252 1252 /*
1253 1253 * Supported ops:
1254 1254 *
1255 1255 * slice deletion
1256 1256 * string assignment (extend node->rev mapping)
1257 1257 * string deletion (shrink node->rev mapping)
1258 1258 */
1259 1259 static int index_assign_subscript(indexObject *self, PyObject *item,
1260 1260 PyObject *value)
1261 1261 {
1262 1262 char *node;
1263 1263 Py_ssize_t nodelen;
1264 1264 long rev;
1265 1265
1266 1266 if (PySlice_Check(item) && value == NULL)
1267 1267 return index_slice_del(self, item);
1268 1268
1269 1269 if (node_check(item, &node, &nodelen) == -1)
1270 1270 return -1;
1271 1271
1272 1272 if (value == NULL)
1273 1273 return self->nt ? nt_insert(self, node, -1) : 0;
1274 1274 rev = PyInt_AsLong(value);
1275 1275 if (rev > INT_MAX || rev < 0) {
1276 1276 if (!PyErr_Occurred())
1277 1277 PyErr_SetString(PyExc_ValueError, "rev out of range");
1278 1278 return -1;
1279 1279 }
1280 1280 return nt_insert(self, node, (int)rev);
1281 1281 }
1282 1282
1283 1283 /*
1284 1284 * Find all RevlogNG entries in an index that has inline data. Update
1285 1285 * the optional "offsets" table with those entries.
1286 1286 */
1287 1287 static long inline_scan(indexObject *self, const char **offsets)
1288 1288 {
1289 1289 const char *data = PyString_AS_STRING(self->data);
1290 1290 const char *end = data + PyString_GET_SIZE(self->data);
1291 1291 long incr = v1_hdrsize;
1292 1292 Py_ssize_t len = 0;
1293 1293
1294 1294 while (data + v1_hdrsize <= end) {
1295 1295 uint32_t comp_len;
1296 1296 const char *old_data;
1297 1297 /* 3rd element of header is length of compressed inline data */
1298 1298 comp_len = getbe32(data + 8);
1299 1299 incr = v1_hdrsize + comp_len;
1300 1300 if (incr < v1_hdrsize)
1301 1301 break;
1302 1302 if (offsets)
1303 1303 offsets[len] = data;
1304 1304 len++;
1305 1305 old_data = data;
1306 1306 data += incr;
1307 1307 if (data <= old_data)
1308 1308 break;
1309 1309 }
1310 1310
1311 1311 if (data != end && data + v1_hdrsize != end) {
1312 1312 if (!PyErr_Occurred())
1313 1313 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1314 1314 return -1;
1315 1315 }
1316 1316
1317 1317 return len;
1318 1318 }
1319 1319
1320 1320 static int index_init(indexObject *self, PyObject *args)
1321 1321 {
1322 1322 PyObject *data_obj, *inlined_obj;
1323 1323 Py_ssize_t size;
1324 1324
1325 1325 if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
1326 1326 return -1;
1327 1327 if (!PyString_Check(data_obj)) {
1328 1328 PyErr_SetString(PyExc_TypeError, "data is not a string");
1329 1329 return -1;
1330 1330 }
1331 1331 size = PyString_GET_SIZE(data_obj);
1332 1332
1333 1333 self->inlined = inlined_obj && PyObject_IsTrue(inlined_obj);
1334 1334 self->data = data_obj;
1335 1335 self->cache = NULL;
1336 1336
1337 1337 self->added = NULL;
1338 1338 self->headrevs = NULL;
1339 1339 self->offsets = NULL;
1340 1340 self->nt = NULL;
1341 1341 self->ntlength = self->ntcapacity = 0;
1342 1342 self->ntdepth = self->ntsplits = 0;
1343 1343 self->ntlookups = self->ntmisses = 0;
1344 1344 self->ntrev = -1;
1345 1345 Py_INCREF(self->data);
1346 1346
1347 1347 if (self->inlined) {
1348 1348 long len = inline_scan(self, NULL);
1349 1349 if (len == -1)
1350 1350 goto bail;
1351 1351 self->raw_length = len;
1352 1352 self->length = len + 1;
1353 1353 } else {
1354 1354 if (size % v1_hdrsize) {
1355 1355 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1356 1356 goto bail;
1357 1357 }
1358 1358 self->raw_length = size / v1_hdrsize;
1359 1359 self->length = self->raw_length + 1;
1360 1360 }
1361 1361
1362 1362 return 0;
1363 1363 bail:
1364 1364 return -1;
1365 1365 }
1366 1366
1367 1367 static PyObject *index_nodemap(indexObject *self)
1368 1368 {
1369 1369 Py_INCREF(self);
1370 1370 return (PyObject *)self;
1371 1371 }
1372 1372
1373 1373 static void index_dealloc(indexObject *self)
1374 1374 {
1375 1375 _index_clearcaches(self);
1376 1376 Py_DECREF(self->data);
1377 1377 Py_XDECREF(self->added);
1378 1378 PyObject_Del(self);
1379 1379 }
1380 1380
1381 1381 static PySequenceMethods index_sequence_methods = {
1382 1382 (lenfunc)index_length, /* sq_length */
1383 1383 0, /* sq_concat */
1384 1384 0, /* sq_repeat */
1385 1385 (ssizeargfunc)index_get, /* sq_item */
1386 1386 0, /* sq_slice */
1387 1387 0, /* sq_ass_item */
1388 1388 0, /* sq_ass_slice */
1389 1389 (objobjproc)index_contains, /* sq_contains */
1390 1390 };
1391 1391
1392 1392 static PyMappingMethods index_mapping_methods = {
1393 1393 (lenfunc)index_length, /* mp_length */
1394 1394 (binaryfunc)index_getitem, /* mp_subscript */
1395 1395 (objobjargproc)index_assign_subscript, /* mp_ass_subscript */
1396 1396 };
1397 1397
1398 1398 static PyMethodDef index_methods[] = {
1399 1399 {"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
1400 1400 "clear the index caches"},
1401 1401 {"get", (PyCFunction)index_m_get, METH_VARARGS,
1402 1402 "get an index entry"},
1403 1403 {"headrevs", (PyCFunction)index_headrevs, METH_NOARGS,
1404 1404 "get head revisions"},
1405 1405 {"insert", (PyCFunction)index_insert, METH_VARARGS,
1406 1406 "insert an index entry"},
1407 1407 {"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
1408 1408 "match a potentially ambiguous node ID"},
1409 1409 {"stats", (PyCFunction)index_stats, METH_NOARGS,
1410 1410 "stats for the index"},
1411 1411 {NULL} /* Sentinel */
1412 1412 };
1413 1413
1414 1414 static PyGetSetDef index_getset[] = {
1415 1415 {"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
1416 1416 {NULL} /* Sentinel */
1417 1417 };
1418 1418
1419 1419 static PyTypeObject indexType = {
1420 1420 PyObject_HEAD_INIT(NULL)
1421 1421 0, /* ob_size */
1422 1422 "parsers.index", /* tp_name */
1423 1423 sizeof(indexObject), /* tp_basicsize */
1424 1424 0, /* tp_itemsize */
1425 1425 (destructor)index_dealloc, /* tp_dealloc */
1426 1426 0, /* tp_print */
1427 1427 0, /* tp_getattr */
1428 1428 0, /* tp_setattr */
1429 1429 0, /* tp_compare */
1430 1430 0, /* tp_repr */
1431 1431 0, /* tp_as_number */
1432 1432 &index_sequence_methods, /* tp_as_sequence */
1433 1433 &index_mapping_methods, /* tp_as_mapping */
1434 1434 0, /* tp_hash */
1435 1435 0, /* tp_call */
1436 1436 0, /* tp_str */
1437 1437 0, /* tp_getattro */
1438 1438 0, /* tp_setattro */
1439 1439 0, /* tp_as_buffer */
1440 1440 Py_TPFLAGS_DEFAULT, /* tp_flags */
1441 1441 "revlog index", /* tp_doc */
1442 1442 0, /* tp_traverse */
1443 1443 0, /* tp_clear */
1444 1444 0, /* tp_richcompare */
1445 1445 0, /* tp_weaklistoffset */
1446 1446 0, /* tp_iter */
1447 1447 0, /* tp_iternext */
1448 1448 index_methods, /* tp_methods */
1449 1449 0, /* tp_members */
1450 1450 index_getset, /* tp_getset */
1451 1451 0, /* tp_base */
1452 1452 0, /* tp_dict */
1453 1453 0, /* tp_descr_get */
1454 1454 0, /* tp_descr_set */
1455 1455 0, /* tp_dictoffset */
1456 1456 (initproc)index_init, /* tp_init */
1457 1457 0, /* tp_alloc */
1458 1458 };
1459 1459
1460 1460 /*
1461 1461 * returns a tuple of the form (index, index, cache) with elements as
1462 1462 * follows:
1463 1463 *
1464 1464 * index: an index object that lazily parses RevlogNG records
1465 1465 * cache: if data is inlined, a tuple (index_file_content, 0), else None
1466 1466 *
1467 1467 * added complications are for backwards compatibility
1468 1468 */
1469 1469 static PyObject *parse_index2(PyObject *self, PyObject *args)
1470 1470 {
1471 1471 PyObject *tuple = NULL, *cache = NULL;
1472 1472 indexObject *idx;
1473 1473 int ret;
1474 1474
1475 1475 idx = PyObject_New(indexObject, &indexType);
1476 1476 if (idx == NULL)
1477 1477 goto bail;
1478 1478
1479 1479 ret = index_init(idx, args);
1480 1480 if (ret == -1)
1481 1481 goto bail;
1482 1482
1483 1483 if (idx->inlined) {
1484 1484 cache = Py_BuildValue("iO", 0, idx->data);
1485 1485 if (cache == NULL)
1486 1486 goto bail;
1487 1487 } else {
1488 1488 cache = Py_None;
1489 1489 Py_INCREF(cache);
1490 1490 }
1491 1491
1492 1492 tuple = Py_BuildValue("NN", idx, cache);
1493 1493 if (!tuple)
1494 1494 goto bail;
1495 1495 return tuple;
1496 1496
1497 1497 bail:
1498 1498 Py_XDECREF(idx);
1499 1499 Py_XDECREF(cache);
1500 1500 Py_XDECREF(tuple);
1501 1501 return NULL;
1502 1502 }
1503 1503
1504 1504 static char parsers_doc[] = "Efficient content parsing.";
1505 1505
1506 1506 static PyMethodDef methods[] = {
1507 1507 {"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
1508 1508 {"parse_manifest", parse_manifest, METH_VARARGS, "parse a manifest\n"},
1509 1509 {"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
1510 1510 {"parse_index2", parse_index2, METH_VARARGS, "parse a revlog index\n"},
1511 1511 {NULL, NULL}
1512 1512 };
1513 1513
1514 1514 static void module_init(PyObject *mod)
1515 1515 {
1516 1516 indexType.tp_new = PyType_GenericNew;
1517 1517 if (PyType_Ready(&indexType) < 0)
1518 1518 return;
1519 1519 Py_INCREF(&indexType);
1520 1520
1521 1521 PyModule_AddObject(mod, "index", (PyObject *)&indexType);
1522 1522
1523 1523 nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
1524 1524 -1, -1, -1, -1, nullid, 20);
1525 1525 if (nullentry)
1526 1526 PyObject_GC_UnTrack(nullentry);
1527 1527
1528 1528 dirstate_unset = Py_BuildValue("ciii", 'n', 0, -1, -1);
1529 1529 }
1530 1530
1531 1531 #ifdef IS_PY3K
1532 1532 static struct PyModuleDef parsers_module = {
1533 1533 PyModuleDef_HEAD_INIT,
1534 1534 "parsers",
1535 1535 parsers_doc,
1536 1536 -1,
1537 1537 methods
1538 1538 };
1539 1539
1540 1540 PyMODINIT_FUNC PyInit_parsers(void)
1541 1541 {
1542 1542 PyObject *mod = PyModule_Create(&parsers_module);
1543 1543 module_init(mod);
1544 1544 return mod;
1545 1545 }
1546 1546 #else
1547 1547 PyMODINIT_FUNC initparsers(void)
1548 1548 {
1549 1549 PyObject *mod = Py_InitModule3("parsers", methods, parsers_doc);
1550 1550 module_init(mod);
1551 1551 }
1552 1552 #endif
General Comments 0
You need to be logged in to leave comments. Login now