##// END OF EJS Templates
lazymanifest: fix memory leak in lmiter_iterentriesnext() after 3d485727e45e
Mike Hommey -
r24699:64cd23a1 default
parent child Browse files
Show More
@@ -1,919 +1,919 b''
1 1 /*
2 2 * manifest.c - manifest type that does on-demand parsing.
3 3 *
4 4 * Copyright 2015, Google Inc.
5 5 *
6 6 * This software may be used and distributed according to the terms of
7 7 * the GNU General Public License, incorporated herein by reference.
8 8 */
9 9 #include <Python.h>
10 10
11 11 #include <assert.h>
12 12 #include <string.h>
13 13 #include <stdlib.h>
14 14
15 15 #include "util.h"
16 16
17 17 #define DEFAULT_LINES 100000
18 18
19 19 typedef struct {
20 20 char *start;
21 21 Py_ssize_t len; /* length of line including terminal newline */
22 22 char hash_suffix;
23 23 bool from_malloc;
24 24 bool deleted;
25 25 } line;
26 26
27 27 typedef struct {
28 28 PyObject_HEAD
29 29 PyObject *pydata;
30 30 line *lines;
31 31 int numlines; /* number of line entries */
32 32 int livelines; /* number of non-deleted lines */
33 33 int maxlines; /* allocated number of lines */
34 34 bool dirty;
35 35 } lazymanifest;
36 36
/*
 * Error codes returned by find_lines(). The values are parenthesized so
 * the negative constants expand safely inside larger expressions.
 */
#define MANIFEST_OOM (-1)
#define MANIFEST_NOT_SORTED (-2)
#define MANIFEST_MALFORMED (-3)
40 40
41 41 /* defined in parsers.c */
42 42 PyObject *unhexlify(const char *str, int len);
43 43
44 44 /* get the length of the path for a line */
45 45 static size_t pathlen(line *l) {
46 46 return strlen(l->start);
47 47 }
48 48
49 49 /* get the node value of a single line */
50 50 static PyObject *nodeof(line *l) {
51 51 char *s = l->start;
52 52 ssize_t llen = pathlen(l);
53 53 PyObject *hash = unhexlify(s + llen + 1, 40);
54 54 if (!hash) {
55 55 return NULL;
56 56 }
57 57 if (l->hash_suffix != '\0') {
58 58 char newhash[21];
59 59 memcpy(newhash, PyString_AsString(hash), 20);
60 60 Py_DECREF(hash);
61 61 newhash[20] = l->hash_suffix;
62 62 hash = PyString_FromStringAndSize(newhash, 21);
63 63 }
64 64 return hash;
65 65 }
66 66
67 67 /* get the node hash and flags of a line as a tuple */
68 68 static PyObject *hashflags(line *l)
69 69 {
70 70 char *s = l->start;
71 71 size_t plen = pathlen(l);
72 72 PyObject *hash = nodeof(l);
73 73
74 74 /* 40 for hash, 1 for null byte, 1 for newline */
75 75 size_t hplen = plen + 42;
76 76 Py_ssize_t flen = l->len - hplen;
77 77 PyObject *flags;
78 78 PyObject *tup;
79 79
80 80 if (!hash)
81 81 return NULL;
82 82 flags = PyString_FromStringAndSize(s + hplen - 1, flen);
83 83 if (!flags) {
84 84 Py_DECREF(hash);
85 85 return NULL;
86 86 }
87 87 tup = PyTuple_Pack(2, hash, flags);
88 88 Py_DECREF(flags);
89 89 Py_DECREF(hash);
90 90 return tup;
91 91 }
92 92
93 93 /* if we're about to run out of space in the line index, add more */
94 94 static bool realloc_if_full(lazymanifest *self)
95 95 {
96 96 if (self->numlines == self->maxlines) {
97 97 self->maxlines *= 2;
98 98 self->lines = realloc(self->lines, self->maxlines * sizeof(line));
99 99 }
100 100 return !!self->lines;
101 101 }
102 102
103 103 /*
104 104 * Find the line boundaries in the manifest that 'data' points to and store
105 105 * information about each line in 'self'.
106 106 */
107 107 static int find_lines(lazymanifest *self, char *data, Py_ssize_t len)
108 108 {
109 109 char *prev = NULL;
110 110 while (len > 0) {
111 111 line *l;
112 112 char *next = memchr(data, '\n', len);
113 113 if (!next) {
114 114 return MANIFEST_MALFORMED;
115 115 }
116 116 next++; /* advance past newline */
117 117 if (!realloc_if_full(self)) {
118 118 return MANIFEST_OOM; /* no memory */
119 119 }
120 120 if (prev && strcmp(prev, data) > -1) {
121 121 /* This data isn't sorted, so we have to abort. */
122 122 return MANIFEST_NOT_SORTED;
123 123 }
124 124 l = self->lines + ((self->numlines)++);
125 125 l->start = data;
126 126 l->len = next - data;
127 127 l->hash_suffix = '\0';
128 128 l->from_malloc = false;
129 129 l->deleted = false;
130 130 len = len - l->len;
131 131 prev = data;
132 132 data = next;
133 133 }
134 134 self->livelines = self->numlines;
135 135 return 0;
136 136 }
137 137
138 138 static int lazymanifest_init(lazymanifest *self, PyObject *args)
139 139 {
140 140 char *data;
141 141 Py_ssize_t len;
142 142 int err, ret;
143 143 PyObject *pydata;
144 144 if (!PyArg_ParseTuple(args, "S", &pydata)) {
145 145 return -1;
146 146 }
147 147 err = PyString_AsStringAndSize(pydata, &data, &len);
148 148
149 149 self->dirty = false;
150 150 if (err == -1)
151 151 return -1;
152 152 self->pydata = pydata;
153 153 Py_INCREF(self->pydata);
154 154 Py_BEGIN_ALLOW_THREADS
155 155 self->lines = malloc(DEFAULT_LINES * sizeof(line));
156 156 self->maxlines = DEFAULT_LINES;
157 157 self->numlines = 0;
158 158 if (!self->lines)
159 159 ret = MANIFEST_OOM;
160 160 else
161 161 ret = find_lines(self, data, len);
162 162 Py_END_ALLOW_THREADS
163 163 switch (ret) {
164 164 case 0:
165 165 break;
166 166 case MANIFEST_OOM:
167 167 PyErr_NoMemory();
168 168 break;
169 169 case MANIFEST_NOT_SORTED:
170 170 PyErr_Format(PyExc_ValueError,
171 171 "Manifest lines not in sorted order.");
172 172 break;
173 173 case MANIFEST_MALFORMED:
174 174 PyErr_Format(PyExc_ValueError,
175 175 "Manifest did not end in a newline.");
176 176 break;
177 177 default:
178 178 PyErr_Format(PyExc_ValueError,
179 179 "Unknown problem parsing manifest.");
180 180 }
181 181 return ret == 0 ? 0 : -1;
182 182 }
183 183
184 184 static void lazymanifest_dealloc(lazymanifest *self)
185 185 {
186 186 /* free any extra lines we had to allocate */
187 187 int i;
188 188 for (i = 0; i < self->numlines; i++) {
189 189 if (self->lines[i].from_malloc) {
190 190 free(self->lines[i].start);
191 191 }
192 192 }
193 193 if (self->lines) {
194 194 free(self->lines);
195 195 self->lines = NULL;
196 196 }
197 197 if (self->pydata) {
198 198 Py_DECREF(self->pydata);
199 199 self->pydata = NULL;
200 200 }
201 201 PyObject_Del(self);
202 202 }
203 203
204 204 /* iteration support */
205 205
206 206 typedef struct {
207 207 PyObject_HEAD lazymanifest *m;
208 208 Py_ssize_t pos;
209 209 } lmIter;
210 210
211 211 static void lmiter_dealloc(PyObject *o)
212 212 {
213 213 lmIter *self = (lmIter *)o;
214 214 Py_DECREF(self->m);
215 215 PyObject_Del(self);
216 216 }
217 217
218 218 static line *lmiter_nextline(lmIter *self)
219 219 {
220 220 do {
221 221 self->pos++;
222 222 if (self->pos >= self->m->numlines) {
223 223 return NULL;
224 224 }
225 225 /* skip over deleted manifest entries */
226 226 } while (self->m->lines[self->pos].deleted);
227 227 return self->m->lines + self->pos;
228 228 }
229 229
230 230 static PyObject *lmiter_iterentriesnext(PyObject *o)
231 231 {
232 232 size_t pl;
233 233 line *l;
234 234 Py_ssize_t consumed;
235 PyObject *path = NULL, *hash = NULL, *flags = NULL;
235 PyObject *ret = NULL, *path = NULL, *hash = NULL, *flags = NULL;
236 236 l = lmiter_nextline((lmIter *)o);
237 237 if (!l) {
238 238 goto bail;
239 239 }
240 240 pl = pathlen(l);
241 241 path = PyString_FromStringAndSize(l->start, pl);
242 242 hash = nodeof(l);
243 243 consumed = pl + 41;
244 244 flags = PyString_FromStringAndSize(l->start + consumed,
245 245 l->len - consumed - 1);
246 246 if (!path || !hash || !flags) {
247 247 goto bail;
248 248 }
249 return PyTuple_Pack(3, path, hash, flags);
249 ret = PyTuple_Pack(3, path, hash, flags);
250 250 bail:
251 251 Py_XDECREF(path);
252 252 Py_XDECREF(hash);
253 253 Py_XDECREF(flags);
254 return NULL;
254 return ret;
255 255 }
256 256
257 257 static PyTypeObject lazymanifestEntriesIterator = {
258 258 PyObject_HEAD_INIT(NULL)
259 259 0, /*ob_size */
260 260 "parsers.lazymanifest.entriesiterator", /*tp_name */
261 261 sizeof(lmIter), /*tp_basicsize */
262 262 0, /*tp_itemsize */
263 263 lmiter_dealloc, /*tp_dealloc */
264 264 0, /*tp_print */
265 265 0, /*tp_getattr */
266 266 0, /*tp_setattr */
267 267 0, /*tp_compare */
268 268 0, /*tp_repr */
269 269 0, /*tp_as_number */
270 270 0, /*tp_as_sequence */
271 271 0, /*tp_as_mapping */
272 272 0, /*tp_hash */
273 273 0, /*tp_call */
274 274 0, /*tp_str */
275 275 0, /*tp_getattro */
276 276 0, /*tp_setattro */
277 277 0, /*tp_as_buffer */
278 278 /* tp_flags: Py_TPFLAGS_HAVE_ITER tells python to
279 279 use tp_iter and tp_iternext fields. */
280 280 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_ITER,
281 281 "Iterator for 3-tuples in a lazymanifest.", /* tp_doc */
282 282 0, /* tp_traverse */
283 283 0, /* tp_clear */
284 284 0, /* tp_richcompare */
285 285 0, /* tp_weaklistoffset */
286 286 PyObject_SelfIter, /* tp_iter: __iter__() method */
287 287 lmiter_iterentriesnext, /* tp_iternext: next() method */
288 288 };
289 289
290 290 static PyObject *lmiter_iterkeysnext(PyObject *o)
291 291 {
292 292 size_t pl;
293 293 line *l = lmiter_nextline((lmIter *)o);
294 294 if (!l) {
295 295 return NULL;
296 296 }
297 297 pl = pathlen(l);
298 298 return PyString_FromStringAndSize(l->start, pl);
299 299 }
300 300
301 301 static PyTypeObject lazymanifestKeysIterator = {
302 302 PyObject_HEAD_INIT(NULL)
303 303 0, /*ob_size */
304 304 "parsers.lazymanifest.keysiterator", /*tp_name */
305 305 sizeof(lmIter), /*tp_basicsize */
306 306 0, /*tp_itemsize */
307 307 lmiter_dealloc, /*tp_dealloc */
308 308 0, /*tp_print */
309 309 0, /*tp_getattr */
310 310 0, /*tp_setattr */
311 311 0, /*tp_compare */
312 312 0, /*tp_repr */
313 313 0, /*tp_as_number */
314 314 0, /*tp_as_sequence */
315 315 0, /*tp_as_mapping */
316 316 0, /*tp_hash */
317 317 0, /*tp_call */
318 318 0, /*tp_str */
319 319 0, /*tp_getattro */
320 320 0, /*tp_setattro */
321 321 0, /*tp_as_buffer */
322 322 /* tp_flags: Py_TPFLAGS_HAVE_ITER tells python to
323 323 use tp_iter and tp_iternext fields. */
324 324 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_ITER,
325 325 "Keys iterator for a lazymanifest.", /* tp_doc */
326 326 0, /* tp_traverse */
327 327 0, /* tp_clear */
328 328 0, /* tp_richcompare */
329 329 0, /* tp_weaklistoffset */
330 330 PyObject_SelfIter, /* tp_iter: __iter__() method */
331 331 lmiter_iterkeysnext, /* tp_iternext: next() method */
332 332 };
333 333
334 334 static lazymanifest *lazymanifest_copy(lazymanifest *self);
335 335
336 336 static PyObject *lazymanifest_getentriesiter(lazymanifest *self)
337 337 {
338 338 lmIter *i = NULL;
339 339 lazymanifest *t = lazymanifest_copy(self);
340 340 if (!t) {
341 341 PyErr_NoMemory();
342 342 return NULL;
343 343 }
344 344 i = PyObject_New(lmIter, &lazymanifestEntriesIterator);
345 345 if (i) {
346 346 i->m = t;
347 347 i->pos = -1;
348 348 } else {
349 349 Py_DECREF(t);
350 350 PyErr_NoMemory();
351 351 }
352 352 return (PyObject *)i;
353 353 }
354 354
355 355 static PyObject *lazymanifest_getkeysiter(lazymanifest *self)
356 356 {
357 357 lmIter *i = NULL;
358 358 lazymanifest *t = lazymanifest_copy(self);
359 359 if (!t) {
360 360 PyErr_NoMemory();
361 361 return NULL;
362 362 }
363 363 i = PyObject_New(lmIter, &lazymanifestKeysIterator);
364 364 if (i) {
365 365 i->m = t;
366 366 i->pos = -1;
367 367 } else {
368 368 Py_DECREF(t);
369 369 PyErr_NoMemory();
370 370 }
371 371 return (PyObject *)i;
372 372 }
373 373
374 374 /* __getitem__ and __setitem__ support */
375 375
376 376 static Py_ssize_t lazymanifest_size(lazymanifest *self)
377 377 {
378 378 return self->livelines;
379 379 }
380 380
381 381 static int linecmp(const void *left, const void *right)
382 382 {
383 383 return strcmp(((const line *)left)->start,
384 384 ((const line *)right)->start);
385 385 }
386 386
387 387 static PyObject *lazymanifest_getitem(lazymanifest *self, PyObject *key)
388 388 {
389 389 line needle;
390 390 line *hit;
391 391 if (!PyString_Check(key)) {
392 392 PyErr_Format(PyExc_TypeError,
393 393 "getitem: manifest keys must be a string.");
394 394 return NULL;
395 395 }
396 396 needle.start = PyString_AsString(key);
397 397 hit = bsearch(&needle, self->lines, self->numlines, sizeof(line),
398 398 &linecmp);
399 399 if (!hit || hit->deleted) {
400 400 PyErr_Format(PyExc_KeyError, "No such manifest entry.");
401 401 return NULL;
402 402 }
403 403 return hashflags(hit);
404 404 }
405 405
406 406 static int lazymanifest_delitem(lazymanifest *self, PyObject *key)
407 407 {
408 408 line needle;
409 409 line *hit;
410 410 if (!PyString_Check(key)) {
411 411 PyErr_Format(PyExc_TypeError,
412 412 "delitem: manifest keys must be a string.");
413 413 return -1;
414 414 }
415 415 needle.start = PyString_AsString(key);
416 416 hit = bsearch(&needle, self->lines, self->numlines, sizeof(line),
417 417 &linecmp);
418 418 if (!hit || hit->deleted) {
419 419 PyErr_Format(PyExc_KeyError,
420 420 "Tried to delete nonexistent manifest entry.");
421 421 return -1;
422 422 }
423 423 self->dirty = true;
424 424 hit->deleted = true;
425 425 self->livelines--;
426 426 return 0;
427 427 }
428 428
429 429 /* Do a binary search for the insertion point for new, creating the
430 430 * new entry if needed. */
431 431 static int internalsetitem(lazymanifest *self, line *new) {
432 432 int start = 0, end = self->numlines;
433 433 while (start < end) {
434 434 int pos = start + (end - start) / 2;
435 435 int c = linecmp(new, self->lines + pos);
436 436 if (c < 0)
437 437 end = pos;
438 438 else if (c > 0)
439 439 start = pos + 1;
440 440 else {
441 441 if (self->lines[pos].deleted)
442 442 self->livelines++;
443 443 start = pos;
444 444 goto finish;
445 445 }
446 446 }
447 447 /* being here means we need to do an insert */
448 448 if (!realloc_if_full(self)) {
449 449 PyErr_NoMemory();
450 450 return -1;
451 451 }
452 452 memmove(self->lines + start + 1, self->lines + start,
453 453 (self->numlines - start) * sizeof(line));
454 454 self->numlines++;
455 455 self->livelines++;
456 456 finish:
457 457 self->lines[start] = *new;
458 458 self->dirty = true;
459 459 return 0;
460 460 }
461 461
462 462 static int lazymanifest_setitem(
463 463 lazymanifest *self, PyObject *key, PyObject *value)
464 464 {
465 465 char *path;
466 466 Py_ssize_t plen;
467 467 PyObject *pyhash;
468 468 Py_ssize_t hlen;
469 469 char *hash;
470 470 PyObject *pyflags;
471 471 char *flags;
472 472 Py_ssize_t flen;
473 473 size_t dlen;
474 474 char *dest;
475 475 int i;
476 476 line new;
477 477 if (!PyString_Check(key)) {
478 478 PyErr_Format(PyExc_TypeError,
479 479 "setitem: manifest keys must be a string.");
480 480 return -1;
481 481 }
482 482 if (!value) {
483 483 return lazymanifest_delitem(self, key);
484 484 }
485 485 if (!PyTuple_Check(value) || PyTuple_Size(value) != 2) {
486 486 PyErr_Format(PyExc_TypeError,
487 487 "Manifest values must be a tuple of (node, flags).");
488 488 return -1;
489 489 }
490 490 if (PyString_AsStringAndSize(key, &path, &plen) == -1) {
491 491 return -1;
492 492 }
493 493
494 494 pyhash = PyTuple_GetItem(value, 0);
495 495 if (!PyString_Check(pyhash)) {
496 496 PyErr_Format(PyExc_TypeError,
497 497 "node must be a 20-byte string");
498 498 return -1;
499 499 }
500 500 hlen = PyString_Size(pyhash);
501 501 /* Some parts of the codebase try and set 21 or 22
502 502 * byte "hash" values in order to perturb things for
503 503 * status. We have to preserve at least the 21st
504 504 * byte. Sigh. If there's a 22nd byte, we drop it on
505 505 * the floor, which works fine.
506 506 */
507 507 if (hlen != 20 && hlen != 21 && hlen != 22) {
508 508 PyErr_Format(PyExc_TypeError,
509 509 "node must be a 20-byte string");
510 510 return -1;
511 511 }
512 512 hash = PyString_AsString(pyhash);
513 513
514 514 pyflags = PyTuple_GetItem(value, 1);
515 515 if (!PyString_Check(pyflags) || PyString_Size(pyflags) > 1) {
516 516 PyErr_Format(PyExc_TypeError,
517 517 "flags must a 0 or 1 byte string");
518 518 return -1;
519 519 }
520 520 if (PyString_AsStringAndSize(pyflags, &flags, &flen) == -1) {
521 521 return -1;
522 522 }
523 523 /* one null byte and one newline */
524 524 dlen = plen + 41 + flen + 1;
525 525 dest = malloc(dlen);
526 526 if (!dest) {
527 527 PyErr_NoMemory();
528 528 return -1;
529 529 }
530 530 memcpy(dest, path, plen + 1);
531 531 for (i = 0; i < 20; i++) {
532 532 /* Cast to unsigned, so it will not get sign-extended when promoted
533 533 * to int (as is done when passing to a variadic function)
534 534 */
535 535 sprintf(dest + plen + 1 + (i * 2), "%02x", (unsigned char)hash[i]);
536 536 }
537 537 memcpy(dest + plen + 41, flags, flen);
538 538 dest[plen + 41 + flen] = '\n';
539 539 new.start = dest;
540 540 new.len = dlen;
541 541 new.hash_suffix = '\0';
542 542 if (hlen > 20) {
543 543 new.hash_suffix = hash[20];
544 544 }
545 545 new.from_malloc = true; /* is `start` a pointer we allocated? */
546 546 new.deleted = false; /* is this entry deleted? */
547 547 if (internalsetitem(self, &new)) {
548 548 return -1;
549 549 }
550 550 return 0;
551 551 }
552 552
553 553 static PyMappingMethods lazymanifest_mapping_methods = {
554 554 (lenfunc)lazymanifest_size, /* mp_length */
555 555 (binaryfunc)lazymanifest_getitem, /* mp_subscript */
556 556 (objobjargproc)lazymanifest_setitem, /* mp_ass_subscript */
557 557 };
558 558
559 559 /* sequence methods (important, or __contains__ builds an iterator) */
560 560
561 561 static int lazymanifest_contains(lazymanifest *self, PyObject *key)
562 562 {
563 563 line needle;
564 564 line *hit;
565 565 if (!PyString_Check(key)) {
566 566 /* Our keys are always strings, so if the contains
567 567 * check is for a non-string, just return false. */
568 568 return 0;
569 569 }
570 570 needle.start = PyString_AsString(key);
571 571 hit = bsearch(&needle, self->lines, self->numlines, sizeof(line),
572 572 &linecmp);
573 573 if (!hit || hit->deleted) {
574 574 return 0;
575 575 }
576 576 return 1;
577 577 }
578 578
579 579 static PySequenceMethods lazymanifest_seq_meths = {
580 580 (lenfunc)lazymanifest_size, /* sq_length */
581 581 0, /* sq_concat */
582 582 0, /* sq_repeat */
583 583 0, /* sq_item */
584 584 0, /* sq_slice */
585 585 0, /* sq_ass_item */
586 586 0, /* sq_ass_slice */
587 587 (objobjproc)lazymanifest_contains, /* sq_contains */
588 588 0, /* sq_inplace_concat */
589 589 0, /* sq_inplace_repeat */
590 590 };
591 591
592 592
593 593 /* Other methods (copy, diff, etc) */
594 594 static PyTypeObject lazymanifestType;
595 595
596 596 /* If the manifest has changes, build the new manifest text and reindex it. */
597 597 static int compact(lazymanifest *self) {
598 598 int i;
599 599 ssize_t need = 0;
600 600 char *data;
601 601 line *src, *dst;
602 602 PyObject *pydata;
603 603 if (!self->dirty)
604 604 return 0;
605 605 for (i = 0; i < self->numlines; i++) {
606 606 if (!self->lines[i].deleted) {
607 607 need += self->lines[i].len;
608 608 }
609 609 }
610 610 pydata = PyString_FromStringAndSize(NULL, need);
611 611 if (!pydata)
612 612 return -1;
613 613 data = PyString_AsString(pydata);
614 614 if (!data) {
615 615 return -1;
616 616 }
617 617 src = self->lines;
618 618 dst = self->lines;
619 619 for (i = 0; i < self->numlines; i++, src++) {
620 620 char *tofree = NULL;
621 621 if (src->from_malloc) {
622 622 tofree = src->start;
623 623 }
624 624 if (!src->deleted) {
625 625 memcpy(data, src->start, src->len);
626 626 *dst = *src;
627 627 dst->start = data;
628 628 dst->from_malloc = false;
629 629 data += dst->len;
630 630 dst++;
631 631 }
632 632 free(tofree);
633 633 }
634 634 Py_DECREF(self->pydata);
635 635 self->pydata = pydata;
636 636 self->numlines = self->livelines;
637 637 self->dirty = false;
638 638 return 0;
639 639 }
640 640
641 641 static PyObject *lazymanifest_text(lazymanifest *self)
642 642 {
643 643 if (compact(self) != 0) {
644 644 PyErr_NoMemory();
645 645 return NULL;
646 646 }
647 647 Py_INCREF(self->pydata);
648 648 return self->pydata;
649 649 }
650 650
651 651 static lazymanifest *lazymanifest_copy(lazymanifest *self)
652 652 {
653 653 lazymanifest *copy = NULL;
654 654 if (compact(self) != 0) {
655 655 goto nomem;
656 656 }
657 657 copy = PyObject_New(lazymanifest, &lazymanifestType);
658 658 if (!copy) {
659 659 goto nomem;
660 660 }
661 661 copy->numlines = self->numlines;
662 662 copy->livelines = self->livelines;
663 663 copy->dirty = false;
664 664 copy->lines = malloc(self->maxlines *sizeof(line));
665 665 if (!copy->lines) {
666 666 goto nomem;
667 667 }
668 668 memcpy(copy->lines, self->lines, self->numlines * sizeof(line));
669 669 copy->maxlines = self->maxlines;
670 670 copy->pydata = self->pydata;
671 671 Py_INCREF(copy->pydata);
672 672 return copy;
673 673 nomem:
674 674 PyErr_NoMemory();
675 675 Py_XDECREF(copy);
676 676 return NULL;
677 677 }
678 678
679 679 static lazymanifest *lazymanifest_filtercopy(
680 680 lazymanifest *self, PyObject *matchfn)
681 681 {
682 682 lazymanifest *copy = NULL;
683 683 int i;
684 684 if (!PyCallable_Check(matchfn)) {
685 685 PyErr_SetString(PyExc_TypeError, "matchfn must be callable");
686 686 return NULL;
687 687 }
688 688 /* compact ourselves first to avoid double-frees later when we
689 689 * compact tmp so that it doesn't have random pointers to our
690 690 * underlying from_malloc-data (self->pydata is safe) */
691 691 if (compact(self) != 0) {
692 692 goto nomem;
693 693 }
694 694 copy = PyObject_New(lazymanifest, &lazymanifestType);
695 695 copy->dirty = true;
696 696 copy->lines = malloc(self->maxlines * sizeof(line));
697 697 if (!copy->lines) {
698 698 goto nomem;
699 699 }
700 700 copy->maxlines = self->maxlines;
701 701 copy->numlines = 0;
702 702 copy->pydata = self->pydata;
703 703 Py_INCREF(self->pydata);
704 704 for (i = 0; i < self->numlines; i++) {
705 705 PyObject *arg = PyString_FromString(self->lines[i].start);
706 706 PyObject *arglist = PyTuple_Pack(1, arg);
707 707 PyObject *result = PyObject_CallObject(matchfn, arglist);
708 708 Py_DECREF(arglist);
709 709 Py_DECREF(arg);
710 710 /* if the callback raised an exception, just let it
711 711 * through and give up */
712 712 if (!result) {
713 713 free(copy->lines);
714 714 Py_DECREF(self->pydata);
715 715 return NULL;
716 716 }
717 717 if (PyObject_IsTrue(result)) {
718 718 assert(!(self->lines[i].from_malloc));
719 719 copy->lines[copy->numlines++] = self->lines[i];
720 720 }
721 721 Py_DECREF(result);
722 722 }
723 723 copy->livelines = copy->numlines;
724 724 return copy;
725 725 nomem:
726 726 PyErr_NoMemory();
727 727 Py_XDECREF(copy);
728 728 return NULL;
729 729 }
730 730
731 731 static PyObject *lazymanifest_diff(lazymanifest *self, PyObject *args)
732 732 {
733 733 lazymanifest *other;
734 734 PyObject *pyclean = NULL;
735 735 bool listclean;
736 736 PyObject *emptyTup = NULL, *ret = NULL;
737 737 PyObject *es;
738 738 int sneedle = 0, oneedle = 0;
739 739 if (!PyArg_ParseTuple(args, "O!|O", &lazymanifestType, &other, &pyclean)) {
740 740 return NULL;
741 741 }
742 742 listclean = (!pyclean) ? false : PyObject_IsTrue(pyclean);
743 743 es = PyString_FromString("");
744 744 if (!es) {
745 745 goto nomem;
746 746 }
747 747 emptyTup = PyTuple_Pack(2, Py_None, es);
748 748 Py_DECREF(es);
749 749 if (!emptyTup) {
750 750 goto nomem;
751 751 }
752 752 ret = PyDict_New();
753 753 if (!ret) {
754 754 goto nomem;
755 755 }
756 756 while (sneedle != self->numlines || oneedle != other->numlines) {
757 757 line *left = self->lines + sneedle;
758 758 line *right = other->lines + oneedle;
759 759 int result;
760 760 PyObject *key;
761 761 PyObject *outer;
762 762 /* If we're looking at a deleted entry and it's not
763 763 * the end of the manifest, just skip it. */
764 764 if (left->deleted && sneedle < self->numlines) {
765 765 sneedle++;
766 766 continue;
767 767 }
768 768 if (right->deleted && oneedle < other->numlines) {
769 769 oneedle++;
770 770 continue;
771 771 }
772 772 /* if we're at the end of either manifest, then we
773 773 * know the remaining items are adds so we can skip
774 774 * the strcmp. */
775 775 if (sneedle == self->numlines) {
776 776 result = 1;
777 777 } else if (oneedle == other->numlines) {
778 778 result = -1;
779 779 } else {
780 780 result = linecmp(left, right);
781 781 }
782 782 key = result <= 0 ?
783 783 PyString_FromString(left->start) :
784 784 PyString_FromString(right->start);
785 785 if (!key)
786 786 goto nomem;
787 787 if (result < 0) {
788 788 PyObject *l = hashflags(left);
789 789 if (!l) {
790 790 goto nomem;
791 791 }
792 792 outer = PyTuple_Pack(2, l, emptyTup);
793 793 Py_DECREF(l);
794 794 if (!outer) {
795 795 goto nomem;
796 796 }
797 797 PyDict_SetItem(ret, key, outer);
798 798 Py_DECREF(outer);
799 799 sneedle++;
800 800 } else if (result > 0) {
801 801 PyObject *r = hashflags(right);
802 802 if (!r) {
803 803 goto nomem;
804 804 }
805 805 outer = PyTuple_Pack(2, emptyTup, r);
806 806 Py_DECREF(r);
807 807 if (!outer) {
808 808 goto nomem;
809 809 }
810 810 PyDict_SetItem(ret, key, outer);
811 811 Py_DECREF(outer);
812 812 oneedle++;
813 813 } else {
814 814 /* file exists in both manifests */
815 815 if (left->len != right->len
816 816 || memcmp(left->start, right->start, left->len)
817 817 || left->hash_suffix != right->hash_suffix) {
818 818 PyObject *l = hashflags(left);
819 819 PyObject *r;
820 820 if (!l) {
821 821 goto nomem;
822 822 }
823 823 r = hashflags(right);
824 824 if (!r) {
825 825 Py_DECREF(l);
826 826 goto nomem;
827 827 }
828 828 outer = PyTuple_Pack(2, l, r);
829 829 Py_DECREF(l);
830 830 Py_DECREF(r);
831 831 if (!outer) {
832 832 goto nomem;
833 833 }
834 834 PyDict_SetItem(ret, key, outer);
835 835 Py_DECREF(outer);
836 836 } else if (listclean) {
837 837 PyDict_SetItem(ret, key, Py_None);
838 838 }
839 839 sneedle++;
840 840 oneedle++;
841 841 }
842 842 Py_DECREF(key);
843 843 }
844 844 Py_DECREF(emptyTup);
845 845 return ret;
846 846 nomem:
847 847 PyErr_NoMemory();
848 848 Py_XDECREF(ret);
849 849 Py_XDECREF(emptyTup);
850 850 return NULL;
851 851 }
852 852
853 853 static PyMethodDef lazymanifest_methods[] = {
854 854 {"iterkeys", (PyCFunction)lazymanifest_getkeysiter, METH_NOARGS,
855 855 "Iterate over file names in this lazymanifest."},
856 856 {"iterentries", (PyCFunction)lazymanifest_getentriesiter, METH_NOARGS,
857 857 "Iterate over (path, nodeid, flags) typles in this lazymanifest."},
858 858 {"copy", (PyCFunction)lazymanifest_copy, METH_NOARGS,
859 859 "Make a copy of this lazymanifest."},
860 860 {"filtercopy", (PyCFunction)lazymanifest_filtercopy, METH_O,
861 861 "Make a copy of this manifest filtered by matchfn."},
862 862 {"diff", (PyCFunction)lazymanifest_diff, METH_VARARGS,
863 863 "Compare this lazymanifest to another one."},
864 864 {"text", (PyCFunction)lazymanifest_text, METH_NOARGS,
865 865 "Encode this manifest to text."},
866 866 {NULL},
867 867 };
868 868
869 869 static PyTypeObject lazymanifestType = {
870 870 PyObject_HEAD_INIT(NULL)
871 871 0, /* ob_size */
872 872 "parsers.lazymanifest", /* tp_name */
873 873 sizeof(lazymanifest), /* tp_basicsize */
874 874 0, /* tp_itemsize */
875 875 (destructor)lazymanifest_dealloc, /* tp_dealloc */
876 876 0, /* tp_print */
877 877 0, /* tp_getattr */
878 878 0, /* tp_setattr */
879 879 0, /* tp_compare */
880 880 0, /* tp_repr */
881 881 0, /* tp_as_number */
882 882 &lazymanifest_seq_meths, /* tp_as_sequence */
883 883 &lazymanifest_mapping_methods, /* tp_as_mapping */
884 884 0, /* tp_hash */
885 885 0, /* tp_call */
886 886 0, /* tp_str */
887 887 0, /* tp_getattro */
888 888 0, /* tp_setattro */
889 889 0, /* tp_as_buffer */
890 890 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_SEQUENCE_IN, /* tp_flags */
891 891 "TODO(augie)", /* tp_doc */
892 892 0, /* tp_traverse */
893 893 0, /* tp_clear */
894 894 0, /* tp_richcompare */
895 895 0, /* tp_weaklistoffset */
896 896 (getiterfunc)lazymanifest_getkeysiter, /* tp_iter */
897 897 0, /* tp_iternext */
898 898 lazymanifest_methods, /* tp_methods */
899 899 0, /* tp_members */
900 900 0, /* tp_getset */
901 901 0, /* tp_base */
902 902 0, /* tp_dict */
903 903 0, /* tp_descr_get */
904 904 0, /* tp_descr_set */
905 905 0, /* tp_dictoffset */
906 906 (initproc)lazymanifest_init, /* tp_init */
907 907 0, /* tp_alloc */
908 908 };
909 909
910 910 void manifest_module_init(PyObject * mod)
911 911 {
912 912 lazymanifestType.tp_new = PyType_GenericNew;
913 913 if (PyType_Ready(&lazymanifestType) < 0)
914 914 return;
915 915 Py_INCREF(&lazymanifestType);
916 916
917 917 PyModule_AddObject(mod, "lazymanifest",
918 918 (PyObject *)&lazymanifestType);
919 919 }
General Comments 0
You need to be logged in to leave comments. Login now