##// END OF EJS Templates
lazymanifest: don't crash when out of memory (issue5916)...
Josef 'Jeff' Sipek -
r38321:6caca2a7 stable
parent child Browse files
Show More
@@ -1,940 +1,940 b''
1 1 /*
2 2 * manifest.c - manifest type that does on-demand parsing.
3 3 *
4 4 * Copyright 2015, Google Inc.
5 5 *
6 6 * This software may be used and distributed according to the terms of
7 7 * the GNU General Public License, incorporated herein by reference.
8 8 */
9 9 #include <Python.h>
10 10
11 11 #include <assert.h>
12 12 #include <stdlib.h>
13 13 #include <string.h>
14 14
15 15 #include "charencode.h"
16 16 #include "util.h"
17 17
/* Number of line entries a freshly initialised manifest index can hold. */
#define DEFAULT_LINES 100000
19 19
20 20 typedef struct {
21 21 char *start;
22 22 Py_ssize_t len; /* length of line including terminal newline */
23 23 char hash_suffix;
24 24 bool from_malloc;
25 25 bool deleted;
26 26 } line;
27 27
28 28 typedef struct {
29 29 PyObject_HEAD
30 30 PyObject *pydata;
31 31 line *lines;
32 32 int numlines; /* number of line entries */
33 33 int livelines; /* number of non-deleted lines */
34 34 int maxlines; /* allocated number of lines */
35 35 bool dirty;
36 36 } lazymanifest;
37 37
/* Failure codes produced while indexing manifest text (0 means success). */
#define MANIFEST_OOM (-1)
#define MANIFEST_NOT_SORTED (-2)
#define MANIFEST_MALFORMED (-3)
41 41
42 42 /* get the length of the path for a line */
43 43 static size_t pathlen(line *l)
44 44 {
45 45 return strlen(l->start);
46 46 }
47 47
48 48 /* get the node value of a single line */
49 49 static PyObject *nodeof(line *l)
50 50 {
51 51 char *s = l->start;
52 52 ssize_t llen = pathlen(l);
53 53 PyObject *hash = unhexlify(s + llen + 1, 40);
54 54 if (!hash) {
55 55 return NULL;
56 56 }
57 57 if (l->hash_suffix != '\0') {
58 58 char newhash[21];
59 59 memcpy(newhash, PyBytes_AsString(hash), 20);
60 60 Py_DECREF(hash);
61 61 newhash[20] = l->hash_suffix;
62 62 hash = PyBytes_FromStringAndSize(newhash, 21);
63 63 }
64 64 return hash;
65 65 }
66 66
67 67 /* get the node hash and flags of a line as a tuple */
68 68 static PyObject *hashflags(line *l)
69 69 {
70 70 char *s = l->start;
71 71 size_t plen = pathlen(l);
72 72 PyObject *hash = nodeof(l);
73 73
74 74 /* 40 for hash, 1 for null byte, 1 for newline */
75 75 size_t hplen = plen + 42;
76 76 Py_ssize_t flen = l->len - hplen;
77 77 PyObject *flags;
78 78 PyObject *tup;
79 79
80 80 if (!hash)
81 81 return NULL;
82 82 flags = PyBytes_FromStringAndSize(s + hplen - 1, flen);
83 83 if (!flags) {
84 84 Py_DECREF(hash);
85 85 return NULL;
86 86 }
87 87 tup = PyTuple_Pack(2, hash, flags);
88 88 Py_DECREF(flags);
89 89 Py_DECREF(hash);
90 90 return tup;
91 91 }
92 92
93 93 /* if we're about to run out of space in the line index, add more */
94 94 static bool realloc_if_full(lazymanifest *self)
95 95 {
96 96 if (self->numlines == self->maxlines) {
97 97 self->maxlines *= 2;
98 98 self->lines = realloc(self->lines, self->maxlines * sizeof(line));
99 99 }
100 100 return !!self->lines;
101 101 }
102 102
103 103 /*
104 104 * Find the line boundaries in the manifest that 'data' points to and store
105 105 * information about each line in 'self'.
106 106 */
107 107 static int find_lines(lazymanifest *self, char *data, Py_ssize_t len)
108 108 {
109 109 char *prev = NULL;
110 110 while (len > 0) {
111 111 line *l;
112 112 char *next = memchr(data, '\n', len);
113 113 if (!next) {
114 114 return MANIFEST_MALFORMED;
115 115 }
116 116 next++; /* advance past newline */
117 117 if (!realloc_if_full(self)) {
118 118 return MANIFEST_OOM; /* no memory */
119 119 }
120 120 if (prev && strcmp(prev, data) > -1) {
121 121 /* This data isn't sorted, so we have to abort. */
122 122 return MANIFEST_NOT_SORTED;
123 123 }
124 124 l = self->lines + ((self->numlines)++);
125 125 l->start = data;
126 126 l->len = next - data;
127 127 l->hash_suffix = '\0';
128 128 l->from_malloc = false;
129 129 l->deleted = false;
130 130 len = len - l->len;
131 131 prev = data;
132 132 data = next;
133 133 }
134 134 self->livelines = self->numlines;
135 135 return 0;
136 136 }
137 137
138 138 static int lazymanifest_init(lazymanifest *self, PyObject *args)
139 139 {
140 140 char *data;
141 141 Py_ssize_t len;
142 142 int err, ret;
143 143 PyObject *pydata;
144 144 if (!PyArg_ParseTuple(args, "S", &pydata)) {
145 145 return -1;
146 146 }
147 147 err = PyBytes_AsStringAndSize(pydata, &data, &len);
148 148
149 149 self->dirty = false;
150 150 if (err == -1)
151 151 return -1;
152 152 self->pydata = pydata;
153 153 Py_INCREF(self->pydata);
154 154 Py_BEGIN_ALLOW_THREADS
155 155 self->lines = malloc(DEFAULT_LINES * sizeof(line));
156 156 self->maxlines = DEFAULT_LINES;
157 157 self->numlines = 0;
158 158 if (!self->lines)
159 159 ret = MANIFEST_OOM;
160 160 else
161 161 ret = find_lines(self, data, len);
162 162 Py_END_ALLOW_THREADS
163 163 switch (ret) {
164 164 case 0:
165 165 break;
166 166 case MANIFEST_OOM:
167 167 PyErr_NoMemory();
168 168 break;
169 169 case MANIFEST_NOT_SORTED:
170 170 PyErr_Format(PyExc_ValueError,
171 171 "Manifest lines not in sorted order.");
172 172 break;
173 173 case MANIFEST_MALFORMED:
174 174 PyErr_Format(PyExc_ValueError,
175 175 "Manifest did not end in a newline.");
176 176 break;
177 177 default:
178 178 PyErr_Format(PyExc_ValueError,
179 179 "Unknown problem parsing manifest.");
180 180 }
181 181 return ret == 0 ? 0 : -1;
182 182 }
183 183
184 184 static void lazymanifest_dealloc(lazymanifest *self)
185 185 {
186 186 /* free any extra lines we had to allocate */
187 187 int i;
188 for (i = 0; i < self->numlines; i++) {
188 for (i = 0; self->lines && (i < self->numlines); i++) {
189 189 if (self->lines[i].from_malloc) {
190 190 free(self->lines[i].start);
191 191 }
192 192 }
193 193 free(self->lines);
194 194 self->lines = NULL;
195 195 if (self->pydata) {
196 196 Py_DECREF(self->pydata);
197 197 self->pydata = NULL;
198 198 }
199 199 PyObject_Del(self);
200 200 }
201 201
202 202 /* iteration support */
203 203
204 204 typedef struct {
205 205 PyObject_HEAD lazymanifest *m;
206 206 Py_ssize_t pos;
207 207 } lmIter;
208 208
209 209 static void lmiter_dealloc(PyObject *o)
210 210 {
211 211 lmIter *self = (lmIter *)o;
212 212 Py_DECREF(self->m);
213 213 PyObject_Del(self);
214 214 }
215 215
216 216 static line *lmiter_nextline(lmIter *self)
217 217 {
218 218 do {
219 219 self->pos++;
220 220 if (self->pos >= self->m->numlines) {
221 221 return NULL;
222 222 }
223 223 /* skip over deleted manifest entries */
224 224 } while (self->m->lines[self->pos].deleted);
225 225 return self->m->lines + self->pos;
226 226 }
227 227
228 228 static PyObject *lmiter_iterentriesnext(PyObject *o)
229 229 {
230 230 size_t pl;
231 231 line *l;
232 232 Py_ssize_t consumed;
233 233 PyObject *ret = NULL, *path = NULL, *hash = NULL, *flags = NULL;
234 234 l = lmiter_nextline((lmIter *)o);
235 235 if (!l) {
236 236 goto done;
237 237 }
238 238 pl = pathlen(l);
239 239 path = PyBytes_FromStringAndSize(l->start, pl);
240 240 hash = nodeof(l);
241 241 consumed = pl + 41;
242 242 flags = PyBytes_FromStringAndSize(l->start + consumed,
243 243 l->len - consumed - 1);
244 244 if (!path || !hash || !flags) {
245 245 goto done;
246 246 }
247 247 ret = PyTuple_Pack(3, path, hash, flags);
248 248 done:
249 249 Py_XDECREF(path);
250 250 Py_XDECREF(hash);
251 251 Py_XDECREF(flags);
252 252 return ret;
253 253 }
254 254
255 255 #ifdef IS_PY3K
256 256 #define LAZYMANIFESTENTRIESITERATOR_TPFLAGS Py_TPFLAGS_DEFAULT
257 257 #else
258 258 #define LAZYMANIFESTENTRIESITERATOR_TPFLAGS Py_TPFLAGS_DEFAULT \
259 259 | Py_TPFLAGS_HAVE_ITER
260 260 #endif
261 261
262 262 static PyTypeObject lazymanifestEntriesIterator = {
263 263 PyVarObject_HEAD_INIT(NULL, 0) /* header */
264 264 "parsers.lazymanifest.entriesiterator", /*tp_name */
265 265 sizeof(lmIter), /*tp_basicsize */
266 266 0, /*tp_itemsize */
267 267 lmiter_dealloc, /*tp_dealloc */
268 268 0, /*tp_print */
269 269 0, /*tp_getattr */
270 270 0, /*tp_setattr */
271 271 0, /*tp_compare */
272 272 0, /*tp_repr */
273 273 0, /*tp_as_number */
274 274 0, /*tp_as_sequence */
275 275 0, /*tp_as_mapping */
276 276 0, /*tp_hash */
277 277 0, /*tp_call */
278 278 0, /*tp_str */
279 279 0, /*tp_getattro */
280 280 0, /*tp_setattro */
281 281 0, /*tp_as_buffer */
282 282 LAZYMANIFESTENTRIESITERATOR_TPFLAGS, /* tp_flags */
283 283 "Iterator for 3-tuples in a lazymanifest.", /* tp_doc */
284 284 0, /* tp_traverse */
285 285 0, /* tp_clear */
286 286 0, /* tp_richcompare */
287 287 0, /* tp_weaklistoffset */
288 288 PyObject_SelfIter, /* tp_iter: __iter__() method */
289 289 lmiter_iterentriesnext, /* tp_iternext: next() method */
290 290 };
291 291
292 292 static PyObject *lmiter_iterkeysnext(PyObject *o)
293 293 {
294 294 size_t pl;
295 295 line *l = lmiter_nextline((lmIter *)o);
296 296 if (!l) {
297 297 return NULL;
298 298 }
299 299 pl = pathlen(l);
300 300 return PyBytes_FromStringAndSize(l->start, pl);
301 301 }
302 302
303 303 #ifdef IS_PY3K
304 304 #define LAZYMANIFESTKEYSITERATOR_TPFLAGS Py_TPFLAGS_DEFAULT
305 305 #else
306 306 #define LAZYMANIFESTKEYSITERATOR_TPFLAGS Py_TPFLAGS_DEFAULT \
307 307 | Py_TPFLAGS_HAVE_ITER
308 308 #endif
309 309
310 310 static PyTypeObject lazymanifestKeysIterator = {
311 311 PyVarObject_HEAD_INIT(NULL, 0) /* header */
312 312 "parsers.lazymanifest.keysiterator", /*tp_name */
313 313 sizeof(lmIter), /*tp_basicsize */
314 314 0, /*tp_itemsize */
315 315 lmiter_dealloc, /*tp_dealloc */
316 316 0, /*tp_print */
317 317 0, /*tp_getattr */
318 318 0, /*tp_setattr */
319 319 0, /*tp_compare */
320 320 0, /*tp_repr */
321 321 0, /*tp_as_number */
322 322 0, /*tp_as_sequence */
323 323 0, /*tp_as_mapping */
324 324 0, /*tp_hash */
325 325 0, /*tp_call */
326 326 0, /*tp_str */
327 327 0, /*tp_getattro */
328 328 0, /*tp_setattro */
329 329 0, /*tp_as_buffer */
330 330 LAZYMANIFESTKEYSITERATOR_TPFLAGS, /* tp_flags */
331 331 "Keys iterator for a lazymanifest.", /* tp_doc */
332 332 0, /* tp_traverse */
333 333 0, /* tp_clear */
334 334 0, /* tp_richcompare */
335 335 0, /* tp_weaklistoffset */
336 336 PyObject_SelfIter, /* tp_iter: __iter__() method */
337 337 lmiter_iterkeysnext, /* tp_iternext: next() method */
338 338 };
339 339
340 340 static lazymanifest *lazymanifest_copy(lazymanifest *self);
341 341
342 342 static PyObject *lazymanifest_getentriesiter(lazymanifest *self)
343 343 {
344 344 lmIter *i = NULL;
345 345 lazymanifest *t = lazymanifest_copy(self);
346 346 if (!t) {
347 347 PyErr_NoMemory();
348 348 return NULL;
349 349 }
350 350 i = PyObject_New(lmIter, &lazymanifestEntriesIterator);
351 351 if (i) {
352 352 i->m = t;
353 353 i->pos = -1;
354 354 } else {
355 355 Py_DECREF(t);
356 356 PyErr_NoMemory();
357 357 }
358 358 return (PyObject *)i;
359 359 }
360 360
361 361 static PyObject *lazymanifest_getkeysiter(lazymanifest *self)
362 362 {
363 363 lmIter *i = NULL;
364 364 lazymanifest *t = lazymanifest_copy(self);
365 365 if (!t) {
366 366 PyErr_NoMemory();
367 367 return NULL;
368 368 }
369 369 i = PyObject_New(lmIter, &lazymanifestKeysIterator);
370 370 if (i) {
371 371 i->m = t;
372 372 i->pos = -1;
373 373 } else {
374 374 Py_DECREF(t);
375 375 PyErr_NoMemory();
376 376 }
377 377 return (PyObject *)i;
378 378 }
379 379
380 380 /* __getitem__ and __setitem__ support */
381 381
382 382 static Py_ssize_t lazymanifest_size(lazymanifest *self)
383 383 {
384 384 return self->livelines;
385 385 }
386 386
387 387 static int linecmp(const void *left, const void *right)
388 388 {
389 389 return strcmp(((const line *)left)->start,
390 390 ((const line *)right)->start);
391 391 }
392 392
393 393 static PyObject *lazymanifest_getitem(lazymanifest *self, PyObject *key)
394 394 {
395 395 line needle;
396 396 line *hit;
397 397 if (!PyBytes_Check(key)) {
398 398 PyErr_Format(PyExc_TypeError,
399 399 "getitem: manifest keys must be a string.");
400 400 return NULL;
401 401 }
402 402 needle.start = PyBytes_AsString(key);
403 403 hit = bsearch(&needle, self->lines, self->numlines, sizeof(line),
404 404 &linecmp);
405 405 if (!hit || hit->deleted) {
406 406 PyErr_Format(PyExc_KeyError, "No such manifest entry.");
407 407 return NULL;
408 408 }
409 409 return hashflags(hit);
410 410 }
411 411
412 412 static int lazymanifest_delitem(lazymanifest *self, PyObject *key)
413 413 {
414 414 line needle;
415 415 line *hit;
416 416 if (!PyBytes_Check(key)) {
417 417 PyErr_Format(PyExc_TypeError,
418 418 "delitem: manifest keys must be a string.");
419 419 return -1;
420 420 }
421 421 needle.start = PyBytes_AsString(key);
422 422 hit = bsearch(&needle, self->lines, self->numlines, sizeof(line),
423 423 &linecmp);
424 424 if (!hit || hit->deleted) {
425 425 PyErr_Format(PyExc_KeyError,
426 426 "Tried to delete nonexistent manifest entry.");
427 427 return -1;
428 428 }
429 429 self->dirty = true;
430 430 hit->deleted = true;
431 431 self->livelines--;
432 432 return 0;
433 433 }
434 434
435 435 /* Do a binary search for the insertion point for new, creating the
436 436 * new entry if needed. */
437 437 static int internalsetitem(lazymanifest *self, line *new)
438 438 {
439 439 int start = 0, end = self->numlines;
440 440 while (start < end) {
441 441 int pos = start + (end - start) / 2;
442 442 int c = linecmp(new, self->lines + pos);
443 443 if (c < 0)
444 444 end = pos;
445 445 else if (c > 0)
446 446 start = pos + 1;
447 447 else {
448 448 if (self->lines[pos].deleted)
449 449 self->livelines++;
450 450 if (self->lines[pos].from_malloc)
451 451 free(self->lines[pos].start);
452 452 start = pos;
453 453 goto finish;
454 454 }
455 455 }
456 456 /* being here means we need to do an insert */
457 457 if (!realloc_if_full(self)) {
458 458 PyErr_NoMemory();
459 459 return -1;
460 460 }
461 461 memmove(self->lines + start + 1, self->lines + start,
462 462 (self->numlines - start) * sizeof(line));
463 463 self->numlines++;
464 464 self->livelines++;
465 465 finish:
466 466 self->lines[start] = *new;
467 467 self->dirty = true;
468 468 return 0;
469 469 }
470 470
471 471 static int lazymanifest_setitem(
472 472 lazymanifest *self, PyObject *key, PyObject *value)
473 473 {
474 474 char *path;
475 475 Py_ssize_t plen;
476 476 PyObject *pyhash;
477 477 Py_ssize_t hlen;
478 478 char *hash;
479 479 PyObject *pyflags;
480 480 char *flags;
481 481 Py_ssize_t flen;
482 482 size_t dlen;
483 483 char *dest;
484 484 int i;
485 485 line new;
486 486 if (!PyBytes_Check(key)) {
487 487 PyErr_Format(PyExc_TypeError,
488 488 "setitem: manifest keys must be a string.");
489 489 return -1;
490 490 }
491 491 if (!value) {
492 492 return lazymanifest_delitem(self, key);
493 493 }
494 494 if (!PyTuple_Check(value) || PyTuple_Size(value) != 2) {
495 495 PyErr_Format(PyExc_TypeError,
496 496 "Manifest values must be a tuple of (node, flags).");
497 497 return -1;
498 498 }
499 499 if (PyBytes_AsStringAndSize(key, &path, &plen) == -1) {
500 500 return -1;
501 501 }
502 502
503 503 pyhash = PyTuple_GetItem(value, 0);
504 504 if (!PyBytes_Check(pyhash)) {
505 505 PyErr_Format(PyExc_TypeError,
506 506 "node must be a 20-byte string");
507 507 return -1;
508 508 }
509 509 hlen = PyBytes_Size(pyhash);
510 510 /* Some parts of the codebase try and set 21 or 22
511 511 * byte "hash" values in order to perturb things for
512 512 * status. We have to preserve at least the 21st
513 513 * byte. Sigh. If there's a 22nd byte, we drop it on
514 514 * the floor, which works fine.
515 515 */
516 516 if (hlen != 20 && hlen != 21 && hlen != 22) {
517 517 PyErr_Format(PyExc_TypeError,
518 518 "node must be a 20-byte string");
519 519 return -1;
520 520 }
521 521 hash = PyBytes_AsString(pyhash);
522 522
523 523 pyflags = PyTuple_GetItem(value, 1);
524 524 if (!PyBytes_Check(pyflags) || PyBytes_Size(pyflags) > 1) {
525 525 PyErr_Format(PyExc_TypeError,
526 526 "flags must a 0 or 1 byte string");
527 527 return -1;
528 528 }
529 529 if (PyBytes_AsStringAndSize(pyflags, &flags, &flen) == -1) {
530 530 return -1;
531 531 }
532 532 /* one null byte and one newline */
533 533 dlen = plen + 41 + flen + 1;
534 534 dest = malloc(dlen);
535 535 if (!dest) {
536 536 PyErr_NoMemory();
537 537 return -1;
538 538 }
539 539 memcpy(dest, path, plen + 1);
540 540 for (i = 0; i < 20; i++) {
541 541 /* Cast to unsigned, so it will not get sign-extended when promoted
542 542 * to int (as is done when passing to a variadic function)
543 543 */
544 544 sprintf(dest + plen + 1 + (i * 2), "%02x", (unsigned char)hash[i]);
545 545 }
546 546 memcpy(dest + plen + 41, flags, flen);
547 547 dest[plen + 41 + flen] = '\n';
548 548 new.start = dest;
549 549 new.len = dlen;
550 550 new.hash_suffix = '\0';
551 551 if (hlen > 20) {
552 552 new.hash_suffix = hash[20];
553 553 }
554 554 new.from_malloc = true; /* is `start` a pointer we allocated? */
555 555 new.deleted = false; /* is this entry deleted? */
556 556 if (internalsetitem(self, &new)) {
557 557 return -1;
558 558 }
559 559 return 0;
560 560 }
561 561
562 562 static PyMappingMethods lazymanifest_mapping_methods = {
563 563 (lenfunc)lazymanifest_size, /* mp_length */
564 564 (binaryfunc)lazymanifest_getitem, /* mp_subscript */
565 565 (objobjargproc)lazymanifest_setitem, /* mp_ass_subscript */
566 566 };
567 567
568 568 /* sequence methods (important or __contains__ builds an iterator) */
569 569
570 570 static int lazymanifest_contains(lazymanifest *self, PyObject *key)
571 571 {
572 572 line needle;
573 573 line *hit;
574 574 if (!PyBytes_Check(key)) {
575 575 /* Our keys are always strings, so if the contains
576 576 * check is for a non-string, just return false. */
577 577 return 0;
578 578 }
579 579 needle.start = PyBytes_AsString(key);
580 580 hit = bsearch(&needle, self->lines, self->numlines, sizeof(line),
581 581 &linecmp);
582 582 if (!hit || hit->deleted) {
583 583 return 0;
584 584 }
585 585 return 1;
586 586 }
587 587
588 588 static PySequenceMethods lazymanifest_seq_meths = {
589 589 (lenfunc)lazymanifest_size, /* sq_length */
590 590 0, /* sq_concat */
591 591 0, /* sq_repeat */
592 592 0, /* sq_item */
593 593 0, /* sq_slice */
594 594 0, /* sq_ass_item */
595 595 0, /* sq_ass_slice */
596 596 (objobjproc)lazymanifest_contains, /* sq_contains */
597 597 0, /* sq_inplace_concat */
598 598 0, /* sq_inplace_repeat */
599 599 };
600 600
601 601
602 602 /* Other methods (copy, diff, etc) */
603 603 static PyTypeObject lazymanifestType;
604 604
605 605 /* If the manifest has changes, build the new manifest text and reindex it. */
606 606 static int compact(lazymanifest *self)
607 607 {
608 608 int i;
609 609 ssize_t need = 0;
610 610 char *data;
611 611 line *src, *dst;
612 612 PyObject *pydata;
613 613 if (!self->dirty)
614 614 return 0;
615 615 for (i = 0; i < self->numlines; i++) {
616 616 if (!self->lines[i].deleted) {
617 617 need += self->lines[i].len;
618 618 }
619 619 }
620 620 pydata = PyBytes_FromStringAndSize(NULL, need);
621 621 if (!pydata)
622 622 return -1;
623 623 data = PyBytes_AsString(pydata);
624 624 if (!data) {
625 625 return -1;
626 626 }
627 627 src = self->lines;
628 628 dst = self->lines;
629 629 for (i = 0; i < self->numlines; i++, src++) {
630 630 char *tofree = NULL;
631 631 if (src->from_malloc) {
632 632 tofree = src->start;
633 633 }
634 634 if (!src->deleted) {
635 635 memcpy(data, src->start, src->len);
636 636 *dst = *src;
637 637 dst->start = data;
638 638 dst->from_malloc = false;
639 639 data += dst->len;
640 640 dst++;
641 641 }
642 642 free(tofree);
643 643 }
644 644 Py_DECREF(self->pydata);
645 645 self->pydata = pydata;
646 646 self->numlines = self->livelines;
647 647 self->dirty = false;
648 648 return 0;
649 649 }
650 650
651 651 static PyObject *lazymanifest_text(lazymanifest *self)
652 652 {
653 653 if (compact(self) != 0) {
654 654 PyErr_NoMemory();
655 655 return NULL;
656 656 }
657 657 Py_INCREF(self->pydata);
658 658 return self->pydata;
659 659 }
660 660
661 661 static lazymanifest *lazymanifest_copy(lazymanifest *self)
662 662 {
663 663 lazymanifest *copy = NULL;
664 664 if (compact(self) != 0) {
665 665 goto nomem;
666 666 }
667 667 copy = PyObject_New(lazymanifest, &lazymanifestType);
668 668 if (!copy) {
669 669 goto nomem;
670 670 }
671 671 copy->numlines = self->numlines;
672 672 copy->livelines = self->livelines;
673 673 copy->dirty = false;
674 674 copy->lines = malloc(self->maxlines *sizeof(line));
675 675 if (!copy->lines) {
676 676 goto nomem;
677 677 }
678 678 memcpy(copy->lines, self->lines, self->numlines * sizeof(line));
679 679 copy->maxlines = self->maxlines;
680 680 copy->pydata = self->pydata;
681 681 Py_INCREF(copy->pydata);
682 682 return copy;
683 683 nomem:
684 684 PyErr_NoMemory();
685 685 Py_XDECREF(copy);
686 686 return NULL;
687 687 }
688 688
689 689 static lazymanifest *lazymanifest_filtercopy(
690 690 lazymanifest *self, PyObject *matchfn)
691 691 {
692 692 lazymanifest *copy = NULL;
693 693 int i;
694 694 if (!PyCallable_Check(matchfn)) {
695 695 PyErr_SetString(PyExc_TypeError, "matchfn must be callable");
696 696 return NULL;
697 697 }
698 698 /* compact ourselves first to avoid double-frees later when we
699 699 * compact tmp so that it doesn't have random pointers to our
700 700 * underlying from_malloc-data (self->pydata is safe) */
701 701 if (compact(self) != 0) {
702 702 goto nomem;
703 703 }
704 704 copy = PyObject_New(lazymanifest, &lazymanifestType);
705 705 if (!copy) {
706 706 goto nomem;
707 707 }
708 708 copy->dirty = true;
709 709 copy->lines = malloc(self->maxlines * sizeof(line));
710 710 if (!copy->lines) {
711 711 goto nomem;
712 712 }
713 713 copy->maxlines = self->maxlines;
714 714 copy->numlines = 0;
715 715 copy->pydata = self->pydata;
716 716 Py_INCREF(self->pydata);
717 717 for (i = 0; i < self->numlines; i++) {
718 718 PyObject *arglist = NULL, *result = NULL;
719 719 arglist = Py_BuildValue(PY23("(s)", "(y)"),
720 720 self->lines[i].start);
721 721 if (!arglist) {
722 722 return NULL;
723 723 }
724 724 result = PyObject_CallObject(matchfn, arglist);
725 725 Py_DECREF(arglist);
726 726 /* if the callback raised an exception, just let it
727 727 * through and give up */
728 728 if (!result) {
729 729 free(copy->lines);
730 730 Py_DECREF(self->pydata);
731 731 return NULL;
732 732 }
733 733 if (PyObject_IsTrue(result)) {
734 734 assert(!(self->lines[i].from_malloc));
735 735 copy->lines[copy->numlines++] = self->lines[i];
736 736 }
737 737 Py_DECREF(result);
738 738 }
739 739 copy->livelines = copy->numlines;
740 740 return copy;
741 741 nomem:
742 742 PyErr_NoMemory();
743 743 Py_XDECREF(copy);
744 744 return NULL;
745 745 }
746 746
747 747 static PyObject *lazymanifest_diff(lazymanifest *self, PyObject *args)
748 748 {
749 749 lazymanifest *other;
750 750 PyObject *pyclean = NULL;
751 751 bool listclean;
752 752 PyObject *emptyTup = NULL, *ret = NULL;
753 753 PyObject *es;
754 754 int sneedle = 0, oneedle = 0;
755 755 if (!PyArg_ParseTuple(args, "O!|O", &lazymanifestType, &other, &pyclean)) {
756 756 return NULL;
757 757 }
758 758 listclean = (!pyclean) ? false : PyObject_IsTrue(pyclean);
759 759 es = PyBytes_FromString("");
760 760 if (!es) {
761 761 goto nomem;
762 762 }
763 763 emptyTup = PyTuple_Pack(2, Py_None, es);
764 764 Py_DECREF(es);
765 765 if (!emptyTup) {
766 766 goto nomem;
767 767 }
768 768 ret = PyDict_New();
769 769 if (!ret) {
770 770 goto nomem;
771 771 }
772 772 while (sneedle != self->numlines || oneedle != other->numlines) {
773 773 line *left = self->lines + sneedle;
774 774 line *right = other->lines + oneedle;
775 775 int result;
776 776 PyObject *key;
777 777 PyObject *outer;
778 778 /* If we're looking at a deleted entry and it's not
779 779 * the end of the manifest, just skip it. */
780 780 if (sneedle < self->numlines && left->deleted) {
781 781 sneedle++;
782 782 continue;
783 783 }
784 784 if (oneedle < other->numlines && right->deleted) {
785 785 oneedle++;
786 786 continue;
787 787 }
788 788 /* if we're at the end of either manifest, then we
789 789 * know the remaining items are adds so we can skip
790 790 * the strcmp. */
791 791 if (sneedle == self->numlines) {
792 792 result = 1;
793 793 } else if (oneedle == other->numlines) {
794 794 result = -1;
795 795 } else {
796 796 result = linecmp(left, right);
797 797 }
798 798 key = result <= 0 ?
799 799 PyBytes_FromString(left->start) :
800 800 PyBytes_FromString(right->start);
801 801 if (!key)
802 802 goto nomem;
803 803 if (result < 0) {
804 804 PyObject *l = hashflags(left);
805 805 if (!l) {
806 806 goto nomem;
807 807 }
808 808 outer = PyTuple_Pack(2, l, emptyTup);
809 809 Py_DECREF(l);
810 810 if (!outer) {
811 811 goto nomem;
812 812 }
813 813 PyDict_SetItem(ret, key, outer);
814 814 Py_DECREF(outer);
815 815 sneedle++;
816 816 } else if (result > 0) {
817 817 PyObject *r = hashflags(right);
818 818 if (!r) {
819 819 goto nomem;
820 820 }
821 821 outer = PyTuple_Pack(2, emptyTup, r);
822 822 Py_DECREF(r);
823 823 if (!outer) {
824 824 goto nomem;
825 825 }
826 826 PyDict_SetItem(ret, key, outer);
827 827 Py_DECREF(outer);
828 828 oneedle++;
829 829 } else {
830 830 /* file exists in both manifests */
831 831 if (left->len != right->len
832 832 || memcmp(left->start, right->start, left->len)
833 833 || left->hash_suffix != right->hash_suffix) {
834 834 PyObject *l = hashflags(left);
835 835 PyObject *r;
836 836 if (!l) {
837 837 goto nomem;
838 838 }
839 839 r = hashflags(right);
840 840 if (!r) {
841 841 Py_DECREF(l);
842 842 goto nomem;
843 843 }
844 844 outer = PyTuple_Pack(2, l, r);
845 845 Py_DECREF(l);
846 846 Py_DECREF(r);
847 847 if (!outer) {
848 848 goto nomem;
849 849 }
850 850 PyDict_SetItem(ret, key, outer);
851 851 Py_DECREF(outer);
852 852 } else if (listclean) {
853 853 PyDict_SetItem(ret, key, Py_None);
854 854 }
855 855 sneedle++;
856 856 oneedle++;
857 857 }
858 858 Py_DECREF(key);
859 859 }
860 860 Py_DECREF(emptyTup);
861 861 return ret;
862 862 nomem:
863 863 PyErr_NoMemory();
864 864 Py_XDECREF(ret);
865 865 Py_XDECREF(emptyTup);
866 866 return NULL;
867 867 }
868 868
869 869 static PyMethodDef lazymanifest_methods[] = {
870 870 {"iterkeys", (PyCFunction)lazymanifest_getkeysiter, METH_NOARGS,
871 871 "Iterate over file names in this lazymanifest."},
872 872 {"iterentries", (PyCFunction)lazymanifest_getentriesiter, METH_NOARGS,
873 873 "Iterate over (path, nodeid, flags) tuples in this lazymanifest."},
874 874 {"copy", (PyCFunction)lazymanifest_copy, METH_NOARGS,
875 875 "Make a copy of this lazymanifest."},
876 876 {"filtercopy", (PyCFunction)lazymanifest_filtercopy, METH_O,
877 877 "Make a copy of this manifest filtered by matchfn."},
878 878 {"diff", (PyCFunction)lazymanifest_diff, METH_VARARGS,
879 879 "Compare this lazymanifest to another one."},
880 880 {"text", (PyCFunction)lazymanifest_text, METH_NOARGS,
881 881 "Encode this manifest to text."},
882 882 {NULL},
883 883 };
884 884
885 885 #ifdef IS_PY3K
886 886 #define LAZYMANIFEST_TPFLAGS Py_TPFLAGS_DEFAULT
887 887 #else
888 888 #define LAZYMANIFEST_TPFLAGS Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_SEQUENCE_IN
889 889 #endif
890 890
891 891 static PyTypeObject lazymanifestType = {
892 892 PyVarObject_HEAD_INIT(NULL, 0) /* header */
893 893 "parsers.lazymanifest", /* tp_name */
894 894 sizeof(lazymanifest), /* tp_basicsize */
895 895 0, /* tp_itemsize */
896 896 (destructor)lazymanifest_dealloc, /* tp_dealloc */
897 897 0, /* tp_print */
898 898 0, /* tp_getattr */
899 899 0, /* tp_setattr */
900 900 0, /* tp_compare */
901 901 0, /* tp_repr */
902 902 0, /* tp_as_number */
903 903 &lazymanifest_seq_meths, /* tp_as_sequence */
904 904 &lazymanifest_mapping_methods, /* tp_as_mapping */
905 905 0, /* tp_hash */
906 906 0, /* tp_call */
907 907 0, /* tp_str */
908 908 0, /* tp_getattro */
909 909 0, /* tp_setattro */
910 910 0, /* tp_as_buffer */
911 911 LAZYMANIFEST_TPFLAGS, /* tp_flags */
912 912 "TODO(augie)", /* tp_doc */
913 913 0, /* tp_traverse */
914 914 0, /* tp_clear */
915 915 0, /* tp_richcompare */
916 916 0, /* tp_weaklistoffset */
917 917 (getiterfunc)lazymanifest_getkeysiter, /* tp_iter */
918 918 0, /* tp_iternext */
919 919 lazymanifest_methods, /* tp_methods */
920 920 0, /* tp_members */
921 921 0, /* tp_getset */
922 922 0, /* tp_base */
923 923 0, /* tp_dict */
924 924 0, /* tp_descr_get */
925 925 0, /* tp_descr_set */
926 926 0, /* tp_dictoffset */
927 927 (initproc)lazymanifest_init, /* tp_init */
928 928 0, /* tp_alloc */
929 929 };
930 930
931 931 void manifest_module_init(PyObject * mod)
932 932 {
933 933 lazymanifestType.tp_new = PyType_GenericNew;
934 934 if (PyType_Ready(&lazymanifestType) < 0)
935 935 return;
936 936 Py_INCREF(&lazymanifestType);
937 937
938 938 PyModule_AddObject(mod, "lazymanifest",
939 939 (PyObject *)&lazymanifestType);
940 940 }
General Comments 0
You need to be logged in to leave comments. Login now