##// END OF EJS Templates
Merge
Bryan O'Sullivan -
r20111:9bfa8674 merge default
parent child Browse files
Show More
@@ -1,1961 +1,1965
1 /*
1 /*
2 parsers.c - efficient content parsing
2 parsers.c - efficient content parsing
3
3
4 Copyright 2008 Matt Mackall <mpm@selenic.com> and others
4 Copyright 2008 Matt Mackall <mpm@selenic.com> and others
5
5
6 This software may be used and distributed according to the terms of
6 This software may be used and distributed according to the terms of
7 the GNU General Public License, incorporated herein by reference.
7 the GNU General Public License, incorporated herein by reference.
8 */
8 */
9
9
10 #include <Python.h>
10 #include <Python.h>
11 #include <ctype.h>
11 #include <ctype.h>
12 #include <stddef.h>
12 #include <stddef.h>
13 #include <string.h>
13 #include <string.h>
14
14
15 #include "util.h"
15 #include "util.h"
16
16
17 static int8_t hextable[256] = {
17 static int8_t hextable[256] = {
18 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
18 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
19 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
19 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
20 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
20 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
21 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, -1, -1, -1, -1, -1, -1, /* 0-9 */
21 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, -1, -1, -1, -1, -1, -1, /* 0-9 */
22 -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, /* A-F */
22 -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, /* A-F */
23 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
23 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
24 -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, /* a-f */
24 -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1, /* a-f */
25 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
25 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
26 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
26 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
27 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
27 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
28 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
28 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
29 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
29 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
30 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
30 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
31 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
31 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
32 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
32 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
33 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1
33 -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1
34 };
34 };
35
35
36 static inline int hexdigit(const char *p, Py_ssize_t off)
36 static inline int hexdigit(const char *p, Py_ssize_t off)
37 {
37 {
38 int8_t val = hextable[(unsigned char)p[off]];
38 int8_t val = hextable[(unsigned char)p[off]];
39
39
40 if (val >= 0) {
40 if (val >= 0) {
41 return val;
41 return val;
42 }
42 }
43
43
44 PyErr_SetString(PyExc_ValueError, "input contains non-hex character");
44 PyErr_SetString(PyExc_ValueError, "input contains non-hex character");
45 return 0;
45 return 0;
46 }
46 }
47
47
48 /*
48 /*
49 * Turn a hex-encoded string into binary.
49 * Turn a hex-encoded string into binary.
50 */
50 */
51 static PyObject *unhexlify(const char *str, int len)
51 static PyObject *unhexlify(const char *str, int len)
52 {
52 {
53 PyObject *ret;
53 PyObject *ret;
54 char *d;
54 char *d;
55 int i;
55 int i;
56
56
57 ret = PyBytes_FromStringAndSize(NULL, len / 2);
57 ret = PyBytes_FromStringAndSize(NULL, len / 2);
58
58
59 if (!ret)
59 if (!ret)
60 return NULL;
60 return NULL;
61
61
62 d = PyBytes_AsString(ret);
62 d = PyBytes_AsString(ret);
63
63
64 for (i = 0; i < len;) {
64 for (i = 0; i < len;) {
65 int hi = hexdigit(str, i++);
65 int hi = hexdigit(str, i++);
66 int lo = hexdigit(str, i++);
66 int lo = hexdigit(str, i++);
67 *d++ = (hi << 4) | lo;
67 *d++ = (hi << 4) | lo;
68 }
68 }
69
69
70 return ret;
70 return ret;
71 }
71 }
72
72
73 /*
73 /*
74 * This code assumes that a manifest is stitched together with newline
74 * This code assumes that a manifest is stitched together with newline
75 * ('\n') characters.
75 * ('\n') characters.
76 */
76 */
77 static PyObject *parse_manifest(PyObject *self, PyObject *args)
77 static PyObject *parse_manifest(PyObject *self, PyObject *args)
78 {
78 {
79 PyObject *mfdict, *fdict;
79 PyObject *mfdict, *fdict;
80 char *str, *start, *end;
80 char *str, *start, *end;
81 int len;
81 int len;
82
82
83 if (!PyArg_ParseTuple(args, "O!O!s#:parse_manifest",
83 if (!PyArg_ParseTuple(args, "O!O!s#:parse_manifest",
84 &PyDict_Type, &mfdict,
84 &PyDict_Type, &mfdict,
85 &PyDict_Type, &fdict,
85 &PyDict_Type, &fdict,
86 &str, &len))
86 &str, &len))
87 goto quit;
87 goto quit;
88
88
89 start = str;
89 start = str;
90 end = str + len;
90 end = str + len;
91 while (start < end) {
91 while (start < end) {
92 PyObject *file = NULL, *node = NULL;
92 PyObject *file = NULL, *node = NULL;
93 PyObject *flags = NULL;
93 PyObject *flags = NULL;
94 char *zero = NULL, *newline = NULL;
94 char *zero = NULL, *newline = NULL;
95 ptrdiff_t nlen;
95 ptrdiff_t nlen;
96
96
97 zero = memchr(start, '\0', end - start);
97 zero = memchr(start, '\0', end - start);
98 if (!zero) {
98 if (!zero) {
99 PyErr_SetString(PyExc_ValueError,
99 PyErr_SetString(PyExc_ValueError,
100 "manifest entry has no separator");
100 "manifest entry has no separator");
101 goto quit;
101 goto quit;
102 }
102 }
103
103
104 newline = memchr(zero + 1, '\n', end - (zero + 1));
104 newline = memchr(zero + 1, '\n', end - (zero + 1));
105 if (!newline) {
105 if (!newline) {
106 PyErr_SetString(PyExc_ValueError,
106 PyErr_SetString(PyExc_ValueError,
107 "manifest contains trailing garbage");
107 "manifest contains trailing garbage");
108 goto quit;
108 goto quit;
109 }
109 }
110
110
111 file = PyBytes_FromStringAndSize(start, zero - start);
111 file = PyBytes_FromStringAndSize(start, zero - start);
112
112
113 if (!file)
113 if (!file)
114 goto bail;
114 goto bail;
115
115
116 nlen = newline - zero - 1;
116 nlen = newline - zero - 1;
117
117
118 node = unhexlify(zero + 1, nlen > 40 ? 40 : (int)nlen);
118 node = unhexlify(zero + 1, nlen > 40 ? 40 : (int)nlen);
119 if (!node)
119 if (!node)
120 goto bail;
120 goto bail;
121
121
122 if (nlen > 40) {
122 if (nlen > 40) {
123 flags = PyBytes_FromStringAndSize(zero + 41,
123 flags = PyBytes_FromStringAndSize(zero + 41,
124 nlen - 40);
124 nlen - 40);
125 if (!flags)
125 if (!flags)
126 goto bail;
126 goto bail;
127
127
128 if (PyDict_SetItem(fdict, file, flags) == -1)
128 if (PyDict_SetItem(fdict, file, flags) == -1)
129 goto bail;
129 goto bail;
130 }
130 }
131
131
132 if (PyDict_SetItem(mfdict, file, node) == -1)
132 if (PyDict_SetItem(mfdict, file, node) == -1)
133 goto bail;
133 goto bail;
134
134
135 start = newline + 1;
135 start = newline + 1;
136
136
137 Py_XDECREF(flags);
137 Py_XDECREF(flags);
138 Py_XDECREF(node);
138 Py_XDECREF(node);
139 Py_XDECREF(file);
139 Py_XDECREF(file);
140 continue;
140 continue;
141 bail:
141 bail:
142 Py_XDECREF(flags);
142 Py_XDECREF(flags);
143 Py_XDECREF(node);
143 Py_XDECREF(node);
144 Py_XDECREF(file);
144 Py_XDECREF(file);
145 goto quit;
145 goto quit;
146 }
146 }
147
147
148 Py_INCREF(Py_None);
148 Py_INCREF(Py_None);
149 return Py_None;
149 return Py_None;
150 quit:
150 quit:
151 return NULL;
151 return NULL;
152 }
152 }
153
153
154 static PyObject *parse_dirstate(PyObject *self, PyObject *args)
154 static PyObject *parse_dirstate(PyObject *self, PyObject *args)
155 {
155 {
156 PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
156 PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
157 PyObject *fname = NULL, *cname = NULL, *entry = NULL;
157 PyObject *fname = NULL, *cname = NULL, *entry = NULL;
158 char state, *str, *cur, *end, *cpos;
158 char state, *str, *cur, *end, *cpos;
159 int mode, size, mtime;
159 int mode, size, mtime;
160 unsigned int flen;
160 unsigned int flen;
161 int len;
161 int len;
162
162
163 if (!PyArg_ParseTuple(args, "O!O!s#:parse_dirstate",
163 if (!PyArg_ParseTuple(args, "O!O!s#:parse_dirstate",
164 &PyDict_Type, &dmap,
164 &PyDict_Type, &dmap,
165 &PyDict_Type, &cmap,
165 &PyDict_Type, &cmap,
166 &str, &len))
166 &str, &len))
167 goto quit;
167 goto quit;
168
168
169 /* read parents */
169 /* read parents */
170 if (len < 40)
170 if (len < 40)
171 goto quit;
171 goto quit;
172
172
173 parents = Py_BuildValue("s#s#", str, 20, str + 20, 20);
173 parents = Py_BuildValue("s#s#", str, 20, str + 20, 20);
174 if (!parents)
174 if (!parents)
175 goto quit;
175 goto quit;
176
176
177 /* read filenames */
177 /* read filenames */
178 cur = str + 40;
178 cur = str + 40;
179 end = str + len;
179 end = str + len;
180
180
181 while (cur < end - 17) {
181 while (cur < end - 17) {
182 /* unpack header */
182 /* unpack header */
183 state = *cur;
183 state = *cur;
184 mode = getbe32(cur + 1);
184 mode = getbe32(cur + 1);
185 size = getbe32(cur + 5);
185 size = getbe32(cur + 5);
186 mtime = getbe32(cur + 9);
186 mtime = getbe32(cur + 9);
187 flen = getbe32(cur + 13);
187 flen = getbe32(cur + 13);
188 cur += 17;
188 cur += 17;
189 if (cur + flen > end || cur + flen < cur) {
189 if (cur + flen > end || cur + flen < cur) {
190 PyErr_SetString(PyExc_ValueError, "overflow in dirstate");
190 PyErr_SetString(PyExc_ValueError, "overflow in dirstate");
191 goto quit;
191 goto quit;
192 }
192 }
193
193
194 entry = Py_BuildValue("ciii", state, mode, size, mtime);
194 entry = Py_BuildValue("ciii", state, mode, size, mtime);
195 if (!entry)
195 if (!entry)
196 goto quit;
196 goto quit;
197 PyObject_GC_UnTrack(entry); /* don't waste time with this */
197 PyObject_GC_UnTrack(entry); /* don't waste time with this */
198
198
199 cpos = memchr(cur, 0, flen);
199 cpos = memchr(cur, 0, flen);
200 if (cpos) {
200 if (cpos) {
201 fname = PyBytes_FromStringAndSize(cur, cpos - cur);
201 fname = PyBytes_FromStringAndSize(cur, cpos - cur);
202 cname = PyBytes_FromStringAndSize(cpos + 1,
202 cname = PyBytes_FromStringAndSize(cpos + 1,
203 flen - (cpos - cur) - 1);
203 flen - (cpos - cur) - 1);
204 if (!fname || !cname ||
204 if (!fname || !cname ||
205 PyDict_SetItem(cmap, fname, cname) == -1 ||
205 PyDict_SetItem(cmap, fname, cname) == -1 ||
206 PyDict_SetItem(dmap, fname, entry) == -1)
206 PyDict_SetItem(dmap, fname, entry) == -1)
207 goto quit;
207 goto quit;
208 Py_DECREF(cname);
208 Py_DECREF(cname);
209 } else {
209 } else {
210 fname = PyBytes_FromStringAndSize(cur, flen);
210 fname = PyBytes_FromStringAndSize(cur, flen);
211 if (!fname ||
211 if (!fname ||
212 PyDict_SetItem(dmap, fname, entry) == -1)
212 PyDict_SetItem(dmap, fname, entry) == -1)
213 goto quit;
213 goto quit;
214 }
214 }
215 cur += flen;
215 cur += flen;
216 Py_DECREF(fname);
216 Py_DECREF(fname);
217 Py_DECREF(entry);
217 Py_DECREF(entry);
218 fname = cname = entry = NULL;
218 fname = cname = entry = NULL;
219 }
219 }
220
220
221 ret = parents;
221 ret = parents;
222 Py_INCREF(ret);
222 Py_INCREF(ret);
223 quit:
223 quit:
224 Py_XDECREF(fname);
224 Py_XDECREF(fname);
225 Py_XDECREF(cname);
225 Py_XDECREF(cname);
226 Py_XDECREF(entry);
226 Py_XDECREF(entry);
227 Py_XDECREF(parents);
227 Py_XDECREF(parents);
228 return ret;
228 return ret;
229 }
229 }
230
230
231 static inline int getintat(PyObject *tuple, int off, uint32_t *v)
231 static inline int getintat(PyObject *tuple, int off, uint32_t *v)
232 {
232 {
233 PyObject *o = PyTuple_GET_ITEM(tuple, off);
233 PyObject *o = PyTuple_GET_ITEM(tuple, off);
234 long val;
234 long val;
235
235
236 if (PyInt_Check(o))
236 if (PyInt_Check(o))
237 val = PyInt_AS_LONG(o);
237 val = PyInt_AS_LONG(o);
238 else if (PyLong_Check(o)) {
238 else if (PyLong_Check(o)) {
239 val = PyLong_AsLong(o);
239 val = PyLong_AsLong(o);
240 if (val == -1 && PyErr_Occurred())
240 if (val == -1 && PyErr_Occurred())
241 return -1;
241 return -1;
242 } else {
242 } else {
243 PyErr_SetString(PyExc_TypeError, "expected an int or long");
243 PyErr_SetString(PyExc_TypeError, "expected an int or long");
244 return -1;
244 return -1;
245 }
245 }
246 if (LONG_MAX > INT_MAX && (val > INT_MAX || val < INT_MIN)) {
246 if (LONG_MAX > INT_MAX && (val > INT_MAX || val < INT_MIN)) {
247 PyErr_SetString(PyExc_OverflowError,
247 PyErr_SetString(PyExc_OverflowError,
248 "Python value to large to convert to uint32_t");
248 "Python value to large to convert to uint32_t");
249 return -1;
249 return -1;
250 }
250 }
251 *v = (uint32_t)val;
251 *v = (uint32_t)val;
252 return 0;
252 return 0;
253 }
253 }
254
254
255 static PyObject *dirstate_unset;
255 static PyObject *dirstate_unset;
256
256
257 /*
257 /*
258 * Efficiently pack a dirstate object into its on-disk format.
258 * Efficiently pack a dirstate object into its on-disk format.
259 */
259 */
260 static PyObject *pack_dirstate(PyObject *self, PyObject *args)
260 static PyObject *pack_dirstate(PyObject *self, PyObject *args)
261 {
261 {
262 PyObject *packobj = NULL;
262 PyObject *packobj = NULL;
263 PyObject *map, *copymap, *pl;
263 PyObject *map, *copymap, *pl;
264 Py_ssize_t nbytes, pos, l;
264 Py_ssize_t nbytes, pos, l;
265 PyObject *k, *v, *pn;
265 PyObject *k, *v, *pn;
266 char *p, *s;
266 char *p, *s;
267 double now;
267 double now;
268
268
269 if (!PyArg_ParseTuple(args, "O!O!Od:pack_dirstate",
269 if (!PyArg_ParseTuple(args, "O!O!Od:pack_dirstate",
270 &PyDict_Type, &map, &PyDict_Type, &copymap,
270 &PyDict_Type, &map, &PyDict_Type, &copymap,
271 &pl, &now))
271 &pl, &now))
272 return NULL;
272 return NULL;
273
273
274 if (!PySequence_Check(pl) || PySequence_Size(pl) != 2) {
274 if (!PySequence_Check(pl) || PySequence_Size(pl) != 2) {
275 PyErr_SetString(PyExc_TypeError, "expected 2-element sequence");
275 PyErr_SetString(PyExc_TypeError, "expected 2-element sequence");
276 return NULL;
276 return NULL;
277 }
277 }
278
278
279 /* Figure out how much we need to allocate. */
279 /* Figure out how much we need to allocate. */
280 for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
280 for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
281 PyObject *c;
281 PyObject *c;
282 if (!PyString_Check(k)) {
282 if (!PyString_Check(k)) {
283 PyErr_SetString(PyExc_TypeError, "expected string key");
283 PyErr_SetString(PyExc_TypeError, "expected string key");
284 goto bail;
284 goto bail;
285 }
285 }
286 nbytes += PyString_GET_SIZE(k) + 17;
286 nbytes += PyString_GET_SIZE(k) + 17;
287 c = PyDict_GetItem(copymap, k);
287 c = PyDict_GetItem(copymap, k);
288 if (c) {
288 if (c) {
289 if (!PyString_Check(c)) {
289 if (!PyString_Check(c)) {
290 PyErr_SetString(PyExc_TypeError,
290 PyErr_SetString(PyExc_TypeError,
291 "expected string key");
291 "expected string key");
292 goto bail;
292 goto bail;
293 }
293 }
294 nbytes += PyString_GET_SIZE(c) + 1;
294 nbytes += PyString_GET_SIZE(c) + 1;
295 }
295 }
296 }
296 }
297
297
298 packobj = PyString_FromStringAndSize(NULL, nbytes);
298 packobj = PyString_FromStringAndSize(NULL, nbytes);
299 if (packobj == NULL)
299 if (packobj == NULL)
300 goto bail;
300 goto bail;
301
301
302 p = PyString_AS_STRING(packobj);
302 p = PyString_AS_STRING(packobj);
303
303
304 pn = PySequence_ITEM(pl, 0);
304 pn = PySequence_ITEM(pl, 0);
305 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
305 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
306 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
306 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
307 goto bail;
307 goto bail;
308 }
308 }
309 memcpy(p, s, l);
309 memcpy(p, s, l);
310 p += 20;
310 p += 20;
311 pn = PySequence_ITEM(pl, 1);
311 pn = PySequence_ITEM(pl, 1);
312 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
312 if (PyString_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
313 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
313 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
314 goto bail;
314 goto bail;
315 }
315 }
316 memcpy(p, s, l);
316 memcpy(p, s, l);
317 p += 20;
317 p += 20;
318
318
319 for (pos = 0; PyDict_Next(map, &pos, &k, &v); ) {
319 for (pos = 0; PyDict_Next(map, &pos, &k, &v); ) {
320 uint32_t mode, size, mtime;
320 uint32_t mode, size, mtime;
321 Py_ssize_t len, l;
321 Py_ssize_t len, l;
322 PyObject *o;
322 PyObject *o;
323 char *s, *t;
323 char *s, *t;
324
324
325 if (!PyTuple_Check(v) || PyTuple_GET_SIZE(v) != 4) {
325 if (!PyTuple_Check(v) || PyTuple_GET_SIZE(v) != 4) {
326 PyErr_SetString(PyExc_TypeError, "expected a 4-tuple");
326 PyErr_SetString(PyExc_TypeError, "expected a 4-tuple");
327 goto bail;
327 goto bail;
328 }
328 }
329 o = PyTuple_GET_ITEM(v, 0);
329 o = PyTuple_GET_ITEM(v, 0);
330 if (PyString_AsStringAndSize(o, &s, &l) == -1 || l != 1) {
330 if (PyString_AsStringAndSize(o, &s, &l) == -1 || l != 1) {
331 PyErr_SetString(PyExc_TypeError, "expected one byte");
331 PyErr_SetString(PyExc_TypeError, "expected one byte");
332 goto bail;
332 goto bail;
333 }
333 }
334 *p++ = *s;
334 *p++ = *s;
335 if (getintat(v, 1, &mode) == -1)
335 if (getintat(v, 1, &mode) == -1)
336 goto bail;
336 goto bail;
337 if (getintat(v, 2, &size) == -1)
337 if (getintat(v, 2, &size) == -1)
338 goto bail;
338 goto bail;
339 if (getintat(v, 3, &mtime) == -1)
339 if (getintat(v, 3, &mtime) == -1)
340 goto bail;
340 goto bail;
341 if (*s == 'n' && mtime == (uint32_t)now) {
341 if (*s == 'n' && mtime == (uint32_t)now) {
342 /* See pure/parsers.py:pack_dirstate for why we do
342 /* See pure/parsers.py:pack_dirstate for why we do
343 * this. */
343 * this. */
344 if (PyDict_SetItem(map, k, dirstate_unset) == -1)
344 if (PyDict_SetItem(map, k, dirstate_unset) == -1)
345 goto bail;
345 goto bail;
346 mtime = -1;
346 mtime = -1;
347 }
347 }
348 putbe32(mode, p);
348 putbe32(mode, p);
349 putbe32(size, p + 4);
349 putbe32(size, p + 4);
350 putbe32(mtime, p + 8);
350 putbe32(mtime, p + 8);
351 t = p + 12;
351 t = p + 12;
352 p += 16;
352 p += 16;
353 len = PyString_GET_SIZE(k);
353 len = PyString_GET_SIZE(k);
354 memcpy(p, PyString_AS_STRING(k), len);
354 memcpy(p, PyString_AS_STRING(k), len);
355 p += len;
355 p += len;
356 o = PyDict_GetItem(copymap, k);
356 o = PyDict_GetItem(copymap, k);
357 if (o) {
357 if (o) {
358 *p++ = '\0';
358 *p++ = '\0';
359 l = PyString_GET_SIZE(o);
359 l = PyString_GET_SIZE(o);
360 memcpy(p, PyString_AS_STRING(o), l);
360 memcpy(p, PyString_AS_STRING(o), l);
361 p += l;
361 p += l;
362 len += l + 1;
362 len += l + 1;
363 }
363 }
364 putbe32((uint32_t)len, t);
364 putbe32((uint32_t)len, t);
365 }
365 }
366
366
367 pos = p - PyString_AS_STRING(packobj);
367 pos = p - PyString_AS_STRING(packobj);
368 if (pos != nbytes) {
368 if (pos != nbytes) {
369 PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
369 PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
370 (long)pos, (long)nbytes);
370 (long)pos, (long)nbytes);
371 goto bail;
371 goto bail;
372 }
372 }
373
373
374 return packobj;
374 return packobj;
375 bail:
375 bail:
376 Py_XDECREF(packobj);
376 Py_XDECREF(packobj);
377 return NULL;
377 return NULL;
378 }
378 }
379
379
380 /*
380 /*
381 * A base-16 trie for fast node->rev mapping.
381 * A base-16 trie for fast node->rev mapping.
382 *
382 *
383 * Positive value is index of the next node in the trie
383 * Positive value is index of the next node in the trie
384 * Negative value is a leaf: -(rev + 1)
384 * Negative value is a leaf: -(rev + 1)
385 * Zero is empty
385 * Zero is empty
386 */
386 */
387 typedef struct {
387 typedef struct {
388 int children[16];
388 int children[16];
389 } nodetree;
389 } nodetree;
390
390
391 /*
391 /*
392 * This class has two behaviours.
392 * This class has two behaviours.
393 *
393 *
394 * When used in a list-like way (with integer keys), we decode an
394 * When used in a list-like way (with integer keys), we decode an
395 * entry in a RevlogNG index file on demand. Our last entry is a
395 * entry in a RevlogNG index file on demand. Our last entry is a
396 * sentinel, always a nullid. We have limited support for
396 * sentinel, always a nullid. We have limited support for
397 * integer-keyed insert and delete, only at elements right before the
397 * integer-keyed insert and delete, only at elements right before the
398 * sentinel.
398 * sentinel.
399 *
399 *
400 * With string keys, we lazily perform a reverse mapping from node to
400 * With string keys, we lazily perform a reverse mapping from node to
401 * rev, using a base-16 trie.
401 * rev, using a base-16 trie.
402 */
402 */
403 typedef struct {
403 typedef struct {
404 PyObject_HEAD
404 PyObject_HEAD
405 /* Type-specific fields go here. */
405 /* Type-specific fields go here. */
406 PyObject *data; /* raw bytes of index */
406 PyObject *data; /* raw bytes of index */
407 PyObject **cache; /* cached tuples */
407 PyObject **cache; /* cached tuples */
408 const char **offsets; /* populated on demand */
408 const char **offsets; /* populated on demand */
409 Py_ssize_t raw_length; /* original number of elements */
409 Py_ssize_t raw_length; /* original number of elements */
410 Py_ssize_t length; /* current number of elements */
410 Py_ssize_t length; /* current number of elements */
411 PyObject *added; /* populated on demand */
411 PyObject *added; /* populated on demand */
412 PyObject *headrevs; /* cache, invalidated on changes */
412 PyObject *headrevs; /* cache, invalidated on changes */
413 nodetree *nt; /* base-16 trie */
413 nodetree *nt; /* base-16 trie */
414 int ntlength; /* # nodes in use */
414 int ntlength; /* # nodes in use */
415 int ntcapacity; /* # nodes allocated */
415 int ntcapacity; /* # nodes allocated */
416 int ntdepth; /* maximum depth of tree */
416 int ntdepth; /* maximum depth of tree */
417 int ntsplits; /* # splits performed */
417 int ntsplits; /* # splits performed */
418 int ntrev; /* last rev scanned */
418 int ntrev; /* last rev scanned */
419 int ntlookups; /* # lookups */
419 int ntlookups; /* # lookups */
420 int ntmisses; /* # lookups that miss the cache */
420 int ntmisses; /* # lookups that miss the cache */
421 int inlined;
421 int inlined;
422 } indexObject;
422 } indexObject;
423
423
424 static Py_ssize_t index_length(const indexObject *self)
424 static Py_ssize_t index_length(const indexObject *self)
425 {
425 {
426 if (self->added == NULL)
426 if (self->added == NULL)
427 return self->length;
427 return self->length;
428 return self->length + PyList_GET_SIZE(self->added);
428 return self->length + PyList_GET_SIZE(self->added);
429 }
429 }
430
430
431 static PyObject *nullentry;
431 static PyObject *nullentry;
432 static const char nullid[20];
432 static const char nullid[20];
433
433
434 static long inline_scan(indexObject *self, const char **offsets);
434 static long inline_scan(indexObject *self, const char **offsets);
435
435
436 #if LONG_MAX == 0x7fffffffL
436 #if LONG_MAX == 0x7fffffffL
437 static char *tuple_format = "Kiiiiiis#";
437 static char *tuple_format = "Kiiiiiis#";
438 #else
438 #else
439 static char *tuple_format = "kiiiiiis#";
439 static char *tuple_format = "kiiiiiis#";
440 #endif
440 #endif
441
441
442 /* A RevlogNG v1 index entry is 64 bytes long. */
442 /* A RevlogNG v1 index entry is 64 bytes long. */
443 static const long v1_hdrsize = 64;
443 static const long v1_hdrsize = 64;
444
444
445 /*
445 /*
446 * Return a pointer to the beginning of a RevlogNG record.
446 * Return a pointer to the beginning of a RevlogNG record.
447 */
447 */
448 static const char *index_deref(indexObject *self, Py_ssize_t pos)
448 static const char *index_deref(indexObject *self, Py_ssize_t pos)
449 {
449 {
450 if (self->inlined && pos > 0) {
450 if (self->inlined && pos > 0) {
451 if (self->offsets == NULL) {
451 if (self->offsets == NULL) {
452 self->offsets = malloc(self->raw_length *
452 self->offsets = malloc(self->raw_length *
453 sizeof(*self->offsets));
453 sizeof(*self->offsets));
454 if (self->offsets == NULL)
454 if (self->offsets == NULL)
455 return (const char *)PyErr_NoMemory();
455 return (const char *)PyErr_NoMemory();
456 inline_scan(self, self->offsets);
456 inline_scan(self, self->offsets);
457 }
457 }
458 return self->offsets[pos];
458 return self->offsets[pos];
459 }
459 }
460
460
461 return PyString_AS_STRING(self->data) + pos * v1_hdrsize;
461 return PyString_AS_STRING(self->data) + pos * v1_hdrsize;
462 }
462 }
463
463
464 /*
464 /*
465 * RevlogNG format (all in big endian, data may be inlined):
465 * RevlogNG format (all in big endian, data may be inlined):
466 * 6 bytes: offset
466 * 6 bytes: offset
467 * 2 bytes: flags
467 * 2 bytes: flags
468 * 4 bytes: compressed length
468 * 4 bytes: compressed length
469 * 4 bytes: uncompressed length
469 * 4 bytes: uncompressed length
470 * 4 bytes: base revision
470 * 4 bytes: base revision
471 * 4 bytes: link revision
471 * 4 bytes: link revision
472 * 4 bytes: parent 1 revision
472 * 4 bytes: parent 1 revision
473 * 4 bytes: parent 2 revision
473 * 4 bytes: parent 2 revision
474 * 32 bytes: nodeid (only 20 bytes used)
474 * 32 bytes: nodeid (only 20 bytes used)
475 */
475 */
476 static PyObject *index_get(indexObject *self, Py_ssize_t pos)
476 static PyObject *index_get(indexObject *self, Py_ssize_t pos)
477 {
477 {
478 uint64_t offset_flags;
478 uint64_t offset_flags;
479 int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
479 int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
480 const char *c_node_id;
480 const char *c_node_id;
481 const char *data;
481 const char *data;
482 Py_ssize_t length = index_length(self);
482 Py_ssize_t length = index_length(self);
483 PyObject *entry;
483 PyObject *entry;
484
484
485 if (pos < 0)
485 if (pos < 0)
486 pos += length;
486 pos += length;
487
487
488 if (pos < 0 || pos >= length) {
488 if (pos < 0 || pos >= length) {
489 PyErr_SetString(PyExc_IndexError, "revlog index out of range");
489 PyErr_SetString(PyExc_IndexError, "revlog index out of range");
490 return NULL;
490 return NULL;
491 }
491 }
492
492
493 if (pos == length - 1) {
493 if (pos == length - 1) {
494 Py_INCREF(nullentry);
494 Py_INCREF(nullentry);
495 return nullentry;
495 return nullentry;
496 }
496 }
497
497
498 if (pos >= self->length - 1) {
498 if (pos >= self->length - 1) {
499 PyObject *obj;
499 PyObject *obj;
500 obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
500 obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
501 Py_INCREF(obj);
501 Py_INCREF(obj);
502 return obj;
502 return obj;
503 }
503 }
504
504
505 if (self->cache) {
505 if (self->cache) {
506 if (self->cache[pos]) {
506 if (self->cache[pos]) {
507 Py_INCREF(self->cache[pos]);
507 Py_INCREF(self->cache[pos]);
508 return self->cache[pos];
508 return self->cache[pos];
509 }
509 }
510 } else {
510 } else {
511 self->cache = calloc(self->raw_length, sizeof(PyObject *));
511 self->cache = calloc(self->raw_length, sizeof(PyObject *));
512 if (self->cache == NULL)
512 if (self->cache == NULL)
513 return PyErr_NoMemory();
513 return PyErr_NoMemory();
514 }
514 }
515
515
516 data = index_deref(self, pos);
516 data = index_deref(self, pos);
517 if (data == NULL)
517 if (data == NULL)
518 return NULL;
518 return NULL;
519
519
520 offset_flags = getbe32(data + 4);
520 offset_flags = getbe32(data + 4);
521 if (pos == 0) /* mask out version number for the first entry */
521 if (pos == 0) /* mask out version number for the first entry */
522 offset_flags &= 0xFFFF;
522 offset_flags &= 0xFFFF;
523 else {
523 else {
524 uint32_t offset_high = getbe32(data);
524 uint32_t offset_high = getbe32(data);
525 offset_flags |= ((uint64_t)offset_high) << 32;
525 offset_flags |= ((uint64_t)offset_high) << 32;
526 }
526 }
527
527
528 comp_len = getbe32(data + 8);
528 comp_len = getbe32(data + 8);
529 uncomp_len = getbe32(data + 12);
529 uncomp_len = getbe32(data + 12);
530 base_rev = getbe32(data + 16);
530 base_rev = getbe32(data + 16);
531 link_rev = getbe32(data + 20);
531 link_rev = getbe32(data + 20);
532 parent_1 = getbe32(data + 24);
532 parent_1 = getbe32(data + 24);
533 parent_2 = getbe32(data + 28);
533 parent_2 = getbe32(data + 28);
534 c_node_id = data + 32;
534 c_node_id = data + 32;
535
535
536 entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
536 entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
537 uncomp_len, base_rev, link_rev,
537 uncomp_len, base_rev, link_rev,
538 parent_1, parent_2, c_node_id, 20);
538 parent_1, parent_2, c_node_id, 20);
539
539
540 if (entry) {
540 if (entry) {
541 PyObject_GC_UnTrack(entry);
541 PyObject_GC_UnTrack(entry);
542 Py_INCREF(entry);
542 Py_INCREF(entry);
543 }
543 }
544
544
545 self->cache[pos] = entry;
545 self->cache[pos] = entry;
546
546
547 return entry;
547 return entry;
548 }
548 }
549
549
550 /*
550 /*
551 * Return the 20-byte SHA of the node corresponding to the given rev.
551 * Return the 20-byte SHA of the node corresponding to the given rev.
552 */
552 */
553 static const char *index_node(indexObject *self, Py_ssize_t pos)
553 static const char *index_node(indexObject *self, Py_ssize_t pos)
554 {
554 {
555 Py_ssize_t length = index_length(self);
555 Py_ssize_t length = index_length(self);
556 const char *data;
556 const char *data;
557
557
558 if (pos == length - 1 || pos == INT_MAX)
558 if (pos == length - 1 || pos == INT_MAX)
559 return nullid;
559 return nullid;
560
560
561 if (pos >= length)
561 if (pos >= length)
562 return NULL;
562 return NULL;
563
563
564 if (pos >= self->length - 1) {
564 if (pos >= self->length - 1) {
565 PyObject *tuple, *str;
565 PyObject *tuple, *str;
566 tuple = PyList_GET_ITEM(self->added, pos - self->length + 1);
566 tuple = PyList_GET_ITEM(self->added, pos - self->length + 1);
567 str = PyTuple_GetItem(tuple, 7);
567 str = PyTuple_GetItem(tuple, 7);
568 return str ? PyString_AS_STRING(str) : NULL;
568 return str ? PyString_AS_STRING(str) : NULL;
569 }
569 }
570
570
571 data = index_deref(self, pos);
571 data = index_deref(self, pos);
572 return data ? data + 32 : NULL;
572 return data ? data + 32 : NULL;
573 }
573 }
574
574
575 static int nt_insert(indexObject *self, const char *node, int rev);
575 static int nt_insert(indexObject *self, const char *node, int rev);
576
576
577 static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
577 static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
578 {
578 {
579 if (PyString_AsStringAndSize(obj, node, nodelen) == -1)
579 if (PyString_AsStringAndSize(obj, node, nodelen) == -1)
580 return -1;
580 return -1;
581 if (*nodelen == 20)
581 if (*nodelen == 20)
582 return 0;
582 return 0;
583 PyErr_SetString(PyExc_ValueError, "20-byte hash required");
583 PyErr_SetString(PyExc_ValueError, "20-byte hash required");
584 return -1;
584 return -1;
585 }
585 }
586
586
587 static PyObject *index_insert(indexObject *self, PyObject *args)
587 static PyObject *index_insert(indexObject *self, PyObject *args)
588 {
588 {
589 PyObject *obj;
589 PyObject *obj;
590 char *node;
590 char *node;
591 long offset;
591 long offset;
592 Py_ssize_t len, nodelen;
592 Py_ssize_t len, nodelen;
593
593
594 if (!PyArg_ParseTuple(args, "lO", &offset, &obj))
594 if (!PyArg_ParseTuple(args, "lO", &offset, &obj))
595 return NULL;
595 return NULL;
596
596
597 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 8) {
597 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 8) {
598 PyErr_SetString(PyExc_TypeError, "8-tuple required");
598 PyErr_SetString(PyExc_TypeError, "8-tuple required");
599 return NULL;
599 return NULL;
600 }
600 }
601
601
602 if (node_check(PyTuple_GET_ITEM(obj, 7), &node, &nodelen) == -1)
602 if (node_check(PyTuple_GET_ITEM(obj, 7), &node, &nodelen) == -1)
603 return NULL;
603 return NULL;
604
604
605 len = index_length(self);
605 len = index_length(self);
606
606
607 if (offset < 0)
607 if (offset < 0)
608 offset += len;
608 offset += len;
609
609
610 if (offset != len - 1) {
610 if (offset != len - 1) {
611 PyErr_SetString(PyExc_IndexError,
611 PyErr_SetString(PyExc_IndexError,
612 "insert only supported at index -1");
612 "insert only supported at index -1");
613 return NULL;
613 return NULL;
614 }
614 }
615
615
616 if (offset > INT_MAX) {
616 if (offset > INT_MAX) {
617 PyErr_SetString(PyExc_ValueError,
617 PyErr_SetString(PyExc_ValueError,
618 "currently only 2**31 revs supported");
618 "currently only 2**31 revs supported");
619 return NULL;
619 return NULL;
620 }
620 }
621
621
622 if (self->added == NULL) {
622 if (self->added == NULL) {
623 self->added = PyList_New(0);
623 self->added = PyList_New(0);
624 if (self->added == NULL)
624 if (self->added == NULL)
625 return NULL;
625 return NULL;
626 }
626 }
627
627
628 if (PyList_Append(self->added, obj) == -1)
628 if (PyList_Append(self->added, obj) == -1)
629 return NULL;
629 return NULL;
630
630
631 if (self->nt)
631 if (self->nt)
632 nt_insert(self, node, (int)offset);
632 nt_insert(self, node, (int)offset);
633
633
634 Py_CLEAR(self->headrevs);
634 Py_CLEAR(self->headrevs);
635 Py_RETURN_NONE;
635 Py_RETURN_NONE;
636 }
636 }
637
637
638 static void _index_clearcaches(indexObject *self)
638 static void _index_clearcaches(indexObject *self)
639 {
639 {
640 if (self->cache) {
640 if (self->cache) {
641 Py_ssize_t i;
641 Py_ssize_t i;
642
642
643 for (i = 0; i < self->raw_length; i++)
643 for (i = 0; i < self->raw_length; i++)
644 Py_CLEAR(self->cache[i]);
644 Py_CLEAR(self->cache[i]);
645 free(self->cache);
645 free(self->cache);
646 self->cache = NULL;
646 self->cache = NULL;
647 }
647 }
648 if (self->offsets) {
648 if (self->offsets) {
649 free(self->offsets);
649 free(self->offsets);
650 self->offsets = NULL;
650 self->offsets = NULL;
651 }
651 }
652 if (self->nt) {
652 if (self->nt) {
653 free(self->nt);
653 free(self->nt);
654 self->nt = NULL;
654 self->nt = NULL;
655 }
655 }
656 Py_CLEAR(self->headrevs);
656 Py_CLEAR(self->headrevs);
657 }
657 }
658
658
659 static PyObject *index_clearcaches(indexObject *self)
659 static PyObject *index_clearcaches(indexObject *self)
660 {
660 {
661 _index_clearcaches(self);
661 _index_clearcaches(self);
662 self->ntlength = self->ntcapacity = 0;
662 self->ntlength = self->ntcapacity = 0;
663 self->ntdepth = self->ntsplits = 0;
663 self->ntdepth = self->ntsplits = 0;
664 self->ntrev = -1;
664 self->ntrev = -1;
665 self->ntlookups = self->ntmisses = 0;
665 self->ntlookups = self->ntmisses = 0;
666 Py_RETURN_NONE;
666 Py_RETURN_NONE;
667 }
667 }
668
668
669 static PyObject *index_stats(indexObject *self)
669 static PyObject *index_stats(indexObject *self)
670 {
670 {
671 PyObject *obj = PyDict_New();
671 PyObject *obj = PyDict_New();
672
672
673 if (obj == NULL)
673 if (obj == NULL)
674 return NULL;
674 return NULL;
675
675
676 #define istat(__n, __d) \
676 #define istat(__n, __d) \
677 if (PyDict_SetItemString(obj, __d, PyInt_FromSsize_t(self->__n)) == -1) \
677 if (PyDict_SetItemString(obj, __d, PyInt_FromSsize_t(self->__n)) == -1) \
678 goto bail;
678 goto bail;
679
679
680 if (self->added) {
680 if (self->added) {
681 Py_ssize_t len = PyList_GET_SIZE(self->added);
681 Py_ssize_t len = PyList_GET_SIZE(self->added);
682 if (PyDict_SetItemString(obj, "index entries added",
682 if (PyDict_SetItemString(obj, "index entries added",
683 PyInt_FromSsize_t(len)) == -1)
683 PyInt_FromSsize_t(len)) == -1)
684 goto bail;
684 goto bail;
685 }
685 }
686
686
687 if (self->raw_length != self->length - 1)
687 if (self->raw_length != self->length - 1)
688 istat(raw_length, "revs on disk");
688 istat(raw_length, "revs on disk");
689 istat(length, "revs in memory");
689 istat(length, "revs in memory");
690 istat(ntcapacity, "node trie capacity");
690 istat(ntcapacity, "node trie capacity");
691 istat(ntdepth, "node trie depth");
691 istat(ntdepth, "node trie depth");
692 istat(ntlength, "node trie count");
692 istat(ntlength, "node trie count");
693 istat(ntlookups, "node trie lookups");
693 istat(ntlookups, "node trie lookups");
694 istat(ntmisses, "node trie misses");
694 istat(ntmisses, "node trie misses");
695 istat(ntrev, "node trie last rev scanned");
695 istat(ntrev, "node trie last rev scanned");
696 istat(ntsplits, "node trie splits");
696 istat(ntsplits, "node trie splits");
697
697
698 #undef istat
698 #undef istat
699
699
700 return obj;
700 return obj;
701
701
702 bail:
702 bail:
703 Py_XDECREF(obj);
703 Py_XDECREF(obj);
704 return NULL;
704 return NULL;
705 }
705 }
706
706
707 /*
707 /*
708 * When we cache a list, we want to be sure the caller can't mutate
708 * When we cache a list, we want to be sure the caller can't mutate
709 * the cached copy.
709 * the cached copy.
710 */
710 */
711 static PyObject *list_copy(PyObject *list)
711 static PyObject *list_copy(PyObject *list)
712 {
712 {
713 Py_ssize_t len = PyList_GET_SIZE(list);
713 Py_ssize_t len = PyList_GET_SIZE(list);
714 PyObject *newlist = PyList_New(len);
714 PyObject *newlist = PyList_New(len);
715 Py_ssize_t i;
715 Py_ssize_t i;
716
716
717 if (newlist == NULL)
717 if (newlist == NULL)
718 return NULL;
718 return NULL;
719
719
720 for (i = 0; i < len; i++) {
720 for (i = 0; i < len; i++) {
721 PyObject *obj = PyList_GET_ITEM(list, i);
721 PyObject *obj = PyList_GET_ITEM(list, i);
722 Py_INCREF(obj);
722 Py_INCREF(obj);
723 PyList_SET_ITEM(newlist, i, obj);
723 PyList_SET_ITEM(newlist, i, obj);
724 }
724 }
725
725
726 return newlist;
726 return newlist;
727 }
727 }
728
728
729 static PyObject *index_headrevs(indexObject *self)
729 static PyObject *index_headrevs(indexObject *self)
730 {
730 {
731 Py_ssize_t i, len, addlen;
731 Py_ssize_t i, len, addlen;
732 char *nothead = NULL;
732 char *nothead = NULL;
733 PyObject *heads;
733 PyObject *heads;
734
734
735 if (self->headrevs)
735 if (self->headrevs)
736 return list_copy(self->headrevs);
736 return list_copy(self->headrevs);
737
737
738 len = index_length(self) - 1;
738 len = index_length(self) - 1;
739 heads = PyList_New(0);
739 heads = PyList_New(0);
740 if (heads == NULL)
740 if (heads == NULL)
741 goto bail;
741 goto bail;
742 if (len == 0) {
742 if (len == 0) {
743 PyObject *nullid = PyInt_FromLong(-1);
743 PyObject *nullid = PyInt_FromLong(-1);
744 if (nullid == NULL || PyList_Append(heads, nullid) == -1) {
744 if (nullid == NULL || PyList_Append(heads, nullid) == -1) {
745 Py_XDECREF(nullid);
745 Py_XDECREF(nullid);
746 goto bail;
746 goto bail;
747 }
747 }
748 goto done;
748 goto done;
749 }
749 }
750
750
751 nothead = calloc(len, 1);
751 nothead = calloc(len, 1);
752 if (nothead == NULL)
752 if (nothead == NULL)
753 goto bail;
753 goto bail;
754
754
755 for (i = 0; i < self->raw_length; i++) {
755 for (i = 0; i < self->raw_length; i++) {
756 const char *data = index_deref(self, i);
756 const char *data = index_deref(self, i);
757 int parent_1 = getbe32(data + 24);
757 int parent_1 = getbe32(data + 24);
758 int parent_2 = getbe32(data + 28);
758 int parent_2 = getbe32(data + 28);
759 if (parent_1 >= 0)
759 if (parent_1 >= 0)
760 nothead[parent_1] = 1;
760 nothead[parent_1] = 1;
761 if (parent_2 >= 0)
761 if (parent_2 >= 0)
762 nothead[parent_2] = 1;
762 nothead[parent_2] = 1;
763 }
763 }
764
764
765 addlen = self->added ? PyList_GET_SIZE(self->added) : 0;
765 addlen = self->added ? PyList_GET_SIZE(self->added) : 0;
766
766
767 for (i = 0; i < addlen; i++) {
767 for (i = 0; i < addlen; i++) {
768 PyObject *rev = PyList_GET_ITEM(self->added, i);
768 PyObject *rev = PyList_GET_ITEM(self->added, i);
769 PyObject *p1 = PyTuple_GET_ITEM(rev, 5);
769 PyObject *p1 = PyTuple_GET_ITEM(rev, 5);
770 PyObject *p2 = PyTuple_GET_ITEM(rev, 6);
770 PyObject *p2 = PyTuple_GET_ITEM(rev, 6);
771 long parent_1, parent_2;
771 long parent_1, parent_2;
772
772
773 if (!PyInt_Check(p1) || !PyInt_Check(p2)) {
773 if (!PyInt_Check(p1) || !PyInt_Check(p2)) {
774 PyErr_SetString(PyExc_TypeError,
774 PyErr_SetString(PyExc_TypeError,
775 "revlog parents are invalid");
775 "revlog parents are invalid");
776 goto bail;
776 goto bail;
777 }
777 }
778 parent_1 = PyInt_AS_LONG(p1);
778 parent_1 = PyInt_AS_LONG(p1);
779 parent_2 = PyInt_AS_LONG(p2);
779 parent_2 = PyInt_AS_LONG(p2);
780 if (parent_1 >= 0)
780 if (parent_1 >= 0)
781 nothead[parent_1] = 1;
781 nothead[parent_1] = 1;
782 if (parent_2 >= 0)
782 if (parent_2 >= 0)
783 nothead[parent_2] = 1;
783 nothead[parent_2] = 1;
784 }
784 }
785
785
786 for (i = 0; i < len; i++) {
786 for (i = 0; i < len; i++) {
787 PyObject *head;
787 PyObject *head;
788
788
789 if (nothead[i])
789 if (nothead[i])
790 continue;
790 continue;
791 head = PyInt_FromLong(i);
791 head = PyInt_FromLong(i);
792 if (head == NULL || PyList_Append(heads, head) == -1) {
792 if (head == NULL || PyList_Append(heads, head) == -1) {
793 Py_XDECREF(head);
793 Py_XDECREF(head);
794 goto bail;
794 goto bail;
795 }
795 }
796 }
796 }
797
797
798 done:
798 done:
799 self->headrevs = heads;
799 self->headrevs = heads;
800 free(nothead);
800 free(nothead);
801 return list_copy(self->headrevs);
801 return list_copy(self->headrevs);
802 bail:
802 bail:
803 Py_XDECREF(heads);
803 Py_XDECREF(heads);
804 free(nothead);
804 free(nothead);
805 return NULL;
805 return NULL;
806 }
806 }
807
807
808 static inline int nt_level(const char *node, Py_ssize_t level)
808 static inline int nt_level(const char *node, Py_ssize_t level)
809 {
809 {
810 int v = node[level>>1];
810 int v = node[level>>1];
811 if (!(level & 1))
811 if (!(level & 1))
812 v >>= 4;
812 v >>= 4;
813 return v & 0xf;
813 return v & 0xf;
814 }
814 }
815
815
816 /*
816 /*
817 * Return values:
817 * Return values:
818 *
818 *
819 * -4: match is ambiguous (multiple candidates)
819 * -4: match is ambiguous (multiple candidates)
820 * -2: not found
820 * -2: not found
821 * rest: valid rev
821 * rest: valid rev
822 */
822 */
823 static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
823 static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
824 int hex)
824 int hex)
825 {
825 {
826 int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
826 int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
827 int level, maxlevel, off;
827 int level, maxlevel, off;
828
828
829 if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
829 if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
830 return -1;
830 return -1;
831
831
832 if (self->nt == NULL)
832 if (self->nt == NULL)
833 return -2;
833 return -2;
834
834
835 if (hex)
835 if (hex)
836 maxlevel = nodelen > 40 ? 40 : (int)nodelen;
836 maxlevel = nodelen > 40 ? 40 : (int)nodelen;
837 else
837 else
838 maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
838 maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
839
839
840 for (level = off = 0; level < maxlevel; level++) {
840 for (level = off = 0; level < maxlevel; level++) {
841 int k = getnybble(node, level);
841 int k = getnybble(node, level);
842 nodetree *n = &self->nt[off];
842 nodetree *n = &self->nt[off];
843 int v = n->children[k];
843 int v = n->children[k];
844
844
845 if (v < 0) {
845 if (v < 0) {
846 const char *n;
846 const char *n;
847 Py_ssize_t i;
847 Py_ssize_t i;
848
848
849 v = -v - 1;
849 v = -v - 1;
850 n = index_node(self, v);
850 n = index_node(self, v);
851 if (n == NULL)
851 if (n == NULL)
852 return -2;
852 return -2;
853 for (i = level; i < maxlevel; i++)
853 for (i = level; i < maxlevel; i++)
854 if (getnybble(node, i) != nt_level(n, i))
854 if (getnybble(node, i) != nt_level(n, i))
855 return -2;
855 return -2;
856 return v;
856 return v;
857 }
857 }
858 if (v == 0)
858 if (v == 0)
859 return -2;
859 return -2;
860 off = v;
860 off = v;
861 }
861 }
862 /* multiple matches against an ambiguous prefix */
862 /* multiple matches against an ambiguous prefix */
863 return -4;
863 return -4;
864 }
864 }
865
865
866 static int nt_new(indexObject *self)
866 static int nt_new(indexObject *self)
867 {
867 {
868 if (self->ntlength == self->ntcapacity) {
868 if (self->ntlength == self->ntcapacity) {
869 self->ntcapacity *= 2;
869 self->ntcapacity *= 2;
870 self->nt = realloc(self->nt,
870 self->nt = realloc(self->nt,
871 self->ntcapacity * sizeof(nodetree));
871 self->ntcapacity * sizeof(nodetree));
872 if (self->nt == NULL) {
872 if (self->nt == NULL) {
873 PyErr_SetString(PyExc_MemoryError, "out of memory");
873 PyErr_SetString(PyExc_MemoryError, "out of memory");
874 return -1;
874 return -1;
875 }
875 }
876 memset(&self->nt[self->ntlength], 0,
876 memset(&self->nt[self->ntlength], 0,
877 sizeof(nodetree) * (self->ntcapacity - self->ntlength));
877 sizeof(nodetree) * (self->ntcapacity - self->ntlength));
878 }
878 }
879 return self->ntlength++;
879 return self->ntlength++;
880 }
880 }
881
881
882 static int nt_insert(indexObject *self, const char *node, int rev)
882 static int nt_insert(indexObject *self, const char *node, int rev)
883 {
883 {
884 int level = 0;
884 int level = 0;
885 int off = 0;
885 int off = 0;
886
886
887 while (level < 40) {
887 while (level < 40) {
888 int k = nt_level(node, level);
888 int k = nt_level(node, level);
889 nodetree *n;
889 nodetree *n;
890 int v;
890 int v;
891
891
892 n = &self->nt[off];
892 n = &self->nt[off];
893 v = n->children[k];
893 v = n->children[k];
894
894
895 if (v == 0) {
895 if (v == 0) {
896 n->children[k] = -rev - 1;
896 n->children[k] = -rev - 1;
897 return 0;
897 return 0;
898 }
898 }
899 if (v < 0) {
899 if (v < 0) {
900 const char *oldnode = index_node(self, -v - 1);
900 const char *oldnode = index_node(self, -v - 1);
901 int noff;
901 int noff;
902
902
903 if (!oldnode || !memcmp(oldnode, node, 20)) {
903 if (!oldnode || !memcmp(oldnode, node, 20)) {
904 n->children[k] = -rev - 1;
904 n->children[k] = -rev - 1;
905 return 0;
905 return 0;
906 }
906 }
907 noff = nt_new(self);
907 noff = nt_new(self);
908 if (noff == -1)
908 if (noff == -1)
909 return -1;
909 return -1;
910 /* self->nt may have been changed by realloc */
910 /* self->nt may have been changed by realloc */
911 self->nt[off].children[k] = noff;
911 self->nt[off].children[k] = noff;
912 off = noff;
912 off = noff;
913 n = &self->nt[off];
913 n = &self->nt[off];
914 n->children[nt_level(oldnode, ++level)] = v;
914 n->children[nt_level(oldnode, ++level)] = v;
915 if (level > self->ntdepth)
915 if (level > self->ntdepth)
916 self->ntdepth = level;
916 self->ntdepth = level;
917 self->ntsplits += 1;
917 self->ntsplits += 1;
918 } else {
918 } else {
919 level += 1;
919 level += 1;
920 off = v;
920 off = v;
921 }
921 }
922 }
922 }
923
923
924 return -1;
924 return -1;
925 }
925 }
926
926
927 static int nt_init(indexObject *self)
927 static int nt_init(indexObject *self)
928 {
928 {
929 if (self->nt == NULL) {
929 if (self->nt == NULL) {
930 if (self->raw_length > INT_MAX) {
930 if (self->raw_length > INT_MAX) {
931 PyErr_SetString(PyExc_ValueError, "overflow in nt_init");
931 PyErr_SetString(PyExc_ValueError, "overflow in nt_init");
932 return -1;
932 return -1;
933 }
933 }
934 self->ntcapacity = self->raw_length < 4
934 self->ntcapacity = self->raw_length < 4
935 ? 4 : (int)self->raw_length / 2;
935 ? 4 : (int)self->raw_length / 2;
936
936
937 self->nt = calloc(self->ntcapacity, sizeof(nodetree));
937 self->nt = calloc(self->ntcapacity, sizeof(nodetree));
938 if (self->nt == NULL) {
938 if (self->nt == NULL) {
939 PyErr_NoMemory();
939 PyErr_NoMemory();
940 return -1;
940 return -1;
941 }
941 }
942 self->ntlength = 1;
942 self->ntlength = 1;
943 self->ntrev = (int)index_length(self) - 1;
943 self->ntrev = (int)index_length(self) - 1;
944 self->ntlookups = 1;
944 self->ntlookups = 1;
945 self->ntmisses = 0;
945 self->ntmisses = 0;
946 if (nt_insert(self, nullid, INT_MAX) == -1)
946 if (nt_insert(self, nullid, INT_MAX) == -1)
947 return -1;
947 return -1;
948 }
948 }
949 return 0;
949 return 0;
950 }
950 }
951
951
952 /*
952 /*
953 * Return values:
953 * Return values:
954 *
954 *
955 * -3: error (exception set)
955 * -3: error (exception set)
956 * -2: not found (no exception set)
956 * -2: not found (no exception set)
957 * rest: valid rev
957 * rest: valid rev
958 */
958 */
959 static int index_find_node(indexObject *self,
959 static int index_find_node(indexObject *self,
960 const char *node, Py_ssize_t nodelen)
960 const char *node, Py_ssize_t nodelen)
961 {
961 {
962 int rev;
962 int rev;
963
963
964 self->ntlookups++;
964 self->ntlookups++;
965 rev = nt_find(self, node, nodelen, 0);
965 rev = nt_find(self, node, nodelen, 0);
966 if (rev >= -1)
966 if (rev >= -1)
967 return rev;
967 return rev;
968
968
969 if (nt_init(self) == -1)
969 if (nt_init(self) == -1)
970 return -3;
970 return -3;
971
971
972 /*
972 /*
973 * For the first handful of lookups, we scan the entire index,
973 * For the first handful of lookups, we scan the entire index,
974 * and cache only the matching nodes. This optimizes for cases
974 * and cache only the matching nodes. This optimizes for cases
975 * like "hg tip", where only a few nodes are accessed.
975 * like "hg tip", where only a few nodes are accessed.
976 *
976 *
977 * After that, we cache every node we visit, using a single
977 * After that, we cache every node we visit, using a single
978 * scan amortized over multiple lookups. This gives the best
978 * scan amortized over multiple lookups. This gives the best
979 * bulk performance, e.g. for "hg log".
979 * bulk performance, e.g. for "hg log".
980 */
980 */
981 if (self->ntmisses++ < 4) {
981 if (self->ntmisses++ < 4) {
982 for (rev = self->ntrev - 1; rev >= 0; rev--) {
982 for (rev = self->ntrev - 1; rev >= 0; rev--) {
983 const char *n = index_node(self, rev);
983 const char *n = index_node(self, rev);
984 if (n == NULL)
984 if (n == NULL)
985 return -2;
985 return -2;
986 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
986 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
987 if (nt_insert(self, n, rev) == -1)
987 if (nt_insert(self, n, rev) == -1)
988 return -3;
988 return -3;
989 break;
989 break;
990 }
990 }
991 }
991 }
992 } else {
992 } else {
993 for (rev = self->ntrev - 1; rev >= 0; rev--) {
993 for (rev = self->ntrev - 1; rev >= 0; rev--) {
994 const char *n = index_node(self, rev);
994 const char *n = index_node(self, rev);
995 if (n == NULL) {
995 if (n == NULL) {
996 self->ntrev = rev + 1;
996 self->ntrev = rev + 1;
997 return -2;
997 return -2;
998 }
998 }
999 if (nt_insert(self, n, rev) == -1) {
999 if (nt_insert(self, n, rev) == -1) {
1000 self->ntrev = rev + 1;
1000 self->ntrev = rev + 1;
1001 return -3;
1001 return -3;
1002 }
1002 }
1003 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1003 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1004 break;
1004 break;
1005 }
1005 }
1006 }
1006 }
1007 self->ntrev = rev;
1007 self->ntrev = rev;
1008 }
1008 }
1009
1009
1010 if (rev >= 0)
1010 if (rev >= 0)
1011 return rev;
1011 return rev;
1012 return -2;
1012 return -2;
1013 }
1013 }
1014
1014
1015 static PyObject *raise_revlog_error(void)
1015 static PyObject *raise_revlog_error(void)
1016 {
1016 {
1017 static PyObject *errclass;
1017 static PyObject *errclass;
1018 PyObject *mod = NULL, *errobj;
1018 PyObject *mod = NULL, *errobj;
1019
1019
1020 if (errclass == NULL) {
1020 if (errclass == NULL) {
1021 PyObject *dict;
1021 PyObject *dict;
1022
1022
1023 mod = PyImport_ImportModule("mercurial.error");
1023 mod = PyImport_ImportModule("mercurial.error");
1024 if (mod == NULL)
1024 if (mod == NULL)
1025 goto classfail;
1025 goto classfail;
1026
1026
1027 dict = PyModule_GetDict(mod);
1027 dict = PyModule_GetDict(mod);
1028 if (dict == NULL)
1028 if (dict == NULL)
1029 goto classfail;
1029 goto classfail;
1030
1030
1031 errclass = PyDict_GetItemString(dict, "RevlogError");
1031 errclass = PyDict_GetItemString(dict, "RevlogError");
1032 if (errclass == NULL) {
1032 if (errclass == NULL) {
1033 PyErr_SetString(PyExc_SystemError,
1033 PyErr_SetString(PyExc_SystemError,
1034 "could not find RevlogError");
1034 "could not find RevlogError");
1035 goto classfail;
1035 goto classfail;
1036 }
1036 }
1037 Py_INCREF(errclass);
1037 Py_INCREF(errclass);
1038 }
1038 }
1039
1039
1040 errobj = PyObject_CallFunction(errclass, NULL);
1040 errobj = PyObject_CallFunction(errclass, NULL);
1041 if (errobj == NULL)
1041 if (errobj == NULL)
1042 return NULL;
1042 return NULL;
1043 PyErr_SetObject(errclass, errobj);
1043 PyErr_SetObject(errclass, errobj);
1044 return errobj;
1044 return errobj;
1045
1045
1046 classfail:
1046 classfail:
1047 Py_XDECREF(mod);
1047 Py_XDECREF(mod);
1048 return NULL;
1048 return NULL;
1049 }
1049 }
1050
1050
1051 static PyObject *index_getitem(indexObject *self, PyObject *value)
1051 static PyObject *index_getitem(indexObject *self, PyObject *value)
1052 {
1052 {
1053 char *node;
1053 char *node;
1054 Py_ssize_t nodelen;
1054 Py_ssize_t nodelen;
1055 int rev;
1055 int rev;
1056
1056
1057 if (PyInt_Check(value))
1057 if (PyInt_Check(value))
1058 return index_get(self, PyInt_AS_LONG(value));
1058 return index_get(self, PyInt_AS_LONG(value));
1059
1059
1060 if (node_check(value, &node, &nodelen) == -1)
1060 if (node_check(value, &node, &nodelen) == -1)
1061 return NULL;
1061 return NULL;
1062 rev = index_find_node(self, node, nodelen);
1062 rev = index_find_node(self, node, nodelen);
1063 if (rev >= -1)
1063 if (rev >= -1)
1064 return PyInt_FromLong(rev);
1064 return PyInt_FromLong(rev);
1065 if (rev == -2)
1065 if (rev == -2)
1066 raise_revlog_error();
1066 raise_revlog_error();
1067 return NULL;
1067 return NULL;
1068 }
1068 }
1069
1069
1070 static int nt_partialmatch(indexObject *self, const char *node,
1070 static int nt_partialmatch(indexObject *self, const char *node,
1071 Py_ssize_t nodelen)
1071 Py_ssize_t nodelen)
1072 {
1072 {
1073 int rev;
1073 int rev;
1074
1074
1075 if (nt_init(self) == -1)
1075 if (nt_init(self) == -1)
1076 return -3;
1076 return -3;
1077
1077
1078 if (self->ntrev > 0) {
1078 if (self->ntrev > 0) {
1079 /* ensure that the radix tree is fully populated */
1079 /* ensure that the radix tree is fully populated */
1080 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1080 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1081 const char *n = index_node(self, rev);
1081 const char *n = index_node(self, rev);
1082 if (n == NULL)
1082 if (n == NULL)
1083 return -2;
1083 return -2;
1084 if (nt_insert(self, n, rev) == -1)
1084 if (nt_insert(self, n, rev) == -1)
1085 return -3;
1085 return -3;
1086 }
1086 }
1087 self->ntrev = rev;
1087 self->ntrev = rev;
1088 }
1088 }
1089
1089
1090 return nt_find(self, node, nodelen, 1);
1090 return nt_find(self, node, nodelen, 1);
1091 }
1091 }
1092
1092
1093 static PyObject *index_partialmatch(indexObject *self, PyObject *args)
1093 static PyObject *index_partialmatch(indexObject *self, PyObject *args)
1094 {
1094 {
1095 const char *fullnode;
1095 const char *fullnode;
1096 int nodelen;
1096 int nodelen;
1097 char *node;
1097 char *node;
1098 int rev, i;
1098 int rev, i;
1099
1099
1100 if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
1100 if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
1101 return NULL;
1101 return NULL;
1102
1102
1103 if (nodelen < 4) {
1103 if (nodelen < 4) {
1104 PyErr_SetString(PyExc_ValueError, "key too short");
1104 PyErr_SetString(PyExc_ValueError, "key too short");
1105 return NULL;
1105 return NULL;
1106 }
1106 }
1107
1107
1108 if (nodelen > 40) {
1108 if (nodelen > 40) {
1109 PyErr_SetString(PyExc_ValueError, "key too long");
1109 PyErr_SetString(PyExc_ValueError, "key too long");
1110 return NULL;
1110 return NULL;
1111 }
1111 }
1112
1112
1113 for (i = 0; i < nodelen; i++)
1113 for (i = 0; i < nodelen; i++)
1114 hexdigit(node, i);
1114 hexdigit(node, i);
1115 if (PyErr_Occurred()) {
1115 if (PyErr_Occurred()) {
1116 /* input contains non-hex characters */
1116 /* input contains non-hex characters */
1117 PyErr_Clear();
1117 PyErr_Clear();
1118 Py_RETURN_NONE;
1118 Py_RETURN_NONE;
1119 }
1119 }
1120
1120
1121 rev = nt_partialmatch(self, node, nodelen);
1121 rev = nt_partialmatch(self, node, nodelen);
1122
1122
1123 switch (rev) {
1123 switch (rev) {
1124 case -4:
1124 case -4:
1125 raise_revlog_error();
1125 raise_revlog_error();
1126 case -3:
1126 case -3:
1127 return NULL;
1127 return NULL;
1128 case -2:
1128 case -2:
1129 Py_RETURN_NONE;
1129 Py_RETURN_NONE;
1130 case -1:
1130 case -1:
1131 return PyString_FromStringAndSize(nullid, 20);
1131 return PyString_FromStringAndSize(nullid, 20);
1132 }
1132 }
1133
1133
1134 fullnode = index_node(self, rev);
1134 fullnode = index_node(self, rev);
1135 if (fullnode == NULL) {
1135 if (fullnode == NULL) {
1136 PyErr_Format(PyExc_IndexError,
1136 PyErr_Format(PyExc_IndexError,
1137 "could not access rev %d", rev);
1137 "could not access rev %d", rev);
1138 return NULL;
1138 return NULL;
1139 }
1139 }
1140 return PyString_FromStringAndSize(fullnode, 20);
1140 return PyString_FromStringAndSize(fullnode, 20);
1141 }
1141 }
1142
1142
1143 static PyObject *index_m_get(indexObject *self, PyObject *args)
1143 static PyObject *index_m_get(indexObject *self, PyObject *args)
1144 {
1144 {
1145 Py_ssize_t nodelen;
1145 Py_ssize_t nodelen;
1146 PyObject *val;
1146 PyObject *val;
1147 char *node;
1147 char *node;
1148 int rev;
1148 int rev;
1149
1149
1150 if (!PyArg_ParseTuple(args, "O", &val))
1150 if (!PyArg_ParseTuple(args, "O", &val))
1151 return NULL;
1151 return NULL;
1152 if (node_check(val, &node, &nodelen) == -1)
1152 if (node_check(val, &node, &nodelen) == -1)
1153 return NULL;
1153 return NULL;
1154 rev = index_find_node(self, node, nodelen);
1154 rev = index_find_node(self, node, nodelen);
1155 if (rev == -3)
1155 if (rev == -3)
1156 return NULL;
1156 return NULL;
1157 if (rev == -2)
1157 if (rev == -2)
1158 Py_RETURN_NONE;
1158 Py_RETURN_NONE;
1159 return PyInt_FromLong(rev);
1159 return PyInt_FromLong(rev);
1160 }
1160 }
1161
1161
1162 static int index_contains(indexObject *self, PyObject *value)
1162 static int index_contains(indexObject *self, PyObject *value)
1163 {
1163 {
1164 char *node;
1164 char *node;
1165 Py_ssize_t nodelen;
1165 Py_ssize_t nodelen;
1166
1166
1167 if (PyInt_Check(value)) {
1167 if (PyInt_Check(value)) {
1168 long rev = PyInt_AS_LONG(value);
1168 long rev = PyInt_AS_LONG(value);
1169 return rev >= -1 && rev < index_length(self);
1169 return rev >= -1 && rev < index_length(self);
1170 }
1170 }
1171
1171
1172 if (node_check(value, &node, &nodelen) == -1)
1172 if (node_check(value, &node, &nodelen) == -1)
1173 return -1;
1173 return -1;
1174
1174
1175 switch (index_find_node(self, node, nodelen)) {
1175 switch (index_find_node(self, node, nodelen)) {
1176 case -3:
1176 case -3:
1177 return -1;
1177 return -1;
1178 case -2:
1178 case -2:
1179 return 0;
1179 return 0;
1180 default:
1180 default:
1181 return 1;
1181 return 1;
1182 }
1182 }
1183 }
1183 }
1184
1184
1185 static inline void index_get_parents(indexObject *self, int rev, int *ps)
1185 static inline void index_get_parents(indexObject *self, int rev, int *ps)
1186 {
1186 {
1187 if (rev >= self->length - 1) {
1187 if (rev >= self->length - 1) {
1188 PyObject *tuple = PyList_GET_ITEM(self->added,
1188 PyObject *tuple = PyList_GET_ITEM(self->added,
1189 rev - self->length + 1);
1189 rev - self->length + 1);
1190 ps[0] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 5));
1190 ps[0] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 5));
1191 ps[1] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 6));
1191 ps[1] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 6));
1192 } else {
1192 } else {
1193 const char *data = index_deref(self, rev);
1193 const char *data = index_deref(self, rev);
1194 ps[0] = getbe32(data + 24);
1194 ps[0] = getbe32(data + 24);
1195 ps[1] = getbe32(data + 28);
1195 ps[1] = getbe32(data + 28);
1196 }
1196 }
1197 }
1197 }
1198
1198
1199 typedef uint64_t bitmask;
1199 typedef uint64_t bitmask;
1200
1200
1201 /*
1201 /*
1202 * Given a disjoint set of revs, return all candidates for the
1202 * Given a disjoint set of revs, return all candidates for the
1203 * greatest common ancestor. In revset notation, this is the set
1203 * greatest common ancestor. In revset notation, this is the set
1204 * "heads(::a and ::b and ...)"
1204 * "heads(::a and ::b and ...)"
1205 */
1205 */
1206 static PyObject *find_gca_candidates(indexObject *self, const int *revs,
1206 static PyObject *find_gca_candidates(indexObject *self, const int *revs,
1207 int revcount)
1207 int revcount)
1208 {
1208 {
1209 const bitmask allseen = (1ull << revcount) - 1;
1209 const bitmask allseen = (1ull << revcount) - 1;
1210 const bitmask poison = 1ull << revcount;
1210 const bitmask poison = 1ull << revcount;
1211 PyObject *gca = PyList_New(0);
1211 PyObject *gca = PyList_New(0);
1212 int i, v, interesting, left;
1212 int i, v, interesting, left;
1213 int maxrev = -1;
1213 int maxrev = -1;
1214 long sp;
1214 long sp;
1215 bitmask *seen;
1215 bitmask *seen;
1216
1216
1217 if (gca == NULL)
1217 if (gca == NULL)
1218 return PyErr_NoMemory();
1218 return PyErr_NoMemory();
1219
1219
1220 for (i = 0; i < revcount; i++) {
1220 for (i = 0; i < revcount; i++) {
1221 if (revs[i] > maxrev)
1221 if (revs[i] > maxrev)
1222 maxrev = revs[i];
1222 maxrev = revs[i];
1223 }
1223 }
1224
1224
1225 seen = calloc(sizeof(*seen), maxrev + 1);
1225 seen = calloc(sizeof(*seen), maxrev + 1);
1226 if (seen == NULL) {
1226 if (seen == NULL) {
1227 Py_DECREF(gca);
1227 Py_DECREF(gca);
1228 return PyErr_NoMemory();
1228 return PyErr_NoMemory();
1229 }
1229 }
1230
1230
1231 for (i = 0; i < revcount; i++)
1231 for (i = 0; i < revcount; i++)
1232 seen[revs[i]] = 1ull << i;
1232 seen[revs[i]] = 1ull << i;
1233
1233
1234 interesting = left = revcount;
1234 interesting = left = revcount;
1235
1235
1236 for (v = maxrev; v >= 0 && interesting; v--) {
1236 for (v = maxrev; v >= 0 && interesting; v--) {
1237 long sv = seen[v];
1237 long sv = seen[v];
1238 int parents[2];
1238 int parents[2];
1239
1239
1240 if (!sv)
1240 if (!sv)
1241 continue;
1241 continue;
1242
1242
1243 if (sv < poison) {
1243 if (sv < poison) {
1244 interesting -= 1;
1244 interesting -= 1;
1245 if (sv == allseen) {
1245 if (sv == allseen) {
1246 PyObject *obj = PyInt_FromLong(v);
1246 PyObject *obj = PyInt_FromLong(v);
1247 if (obj == NULL)
1247 if (obj == NULL)
1248 goto bail;
1248 goto bail;
1249 if (PyList_Append(gca, obj) == -1) {
1249 if (PyList_Append(gca, obj) == -1) {
1250 Py_DECREF(obj);
1250 Py_DECREF(obj);
1251 goto bail;
1251 goto bail;
1252 }
1252 }
1253 sv |= poison;
1253 sv |= poison;
1254 for (i = 0; i < revcount; i++) {
1254 for (i = 0; i < revcount; i++) {
1255 if (revs[i] == v) {
1255 if (revs[i] == v) {
1256 if (--left <= 1)
1256 if (--left <= 1)
1257 goto done;
1257 goto done;
1258 break;
1258 break;
1259 }
1259 }
1260 }
1260 }
1261 }
1261 }
1262 }
1262 }
1263 index_get_parents(self, v, parents);
1263 index_get_parents(self, v, parents);
1264
1264
1265 for (i = 0; i < 2; i++) {
1265 for (i = 0; i < 2; i++) {
1266 int p = parents[i];
1266 int p = parents[i];
1267 if (p == -1)
1267 if (p == -1)
1268 continue;
1268 continue;
1269 sp = seen[p];
1269 sp = seen[p];
1270 if (sv < poison) {
1270 if (sv < poison) {
1271 if (sp == 0) {
1271 if (sp == 0) {
1272 seen[p] = sv;
1272 seen[p] = sv;
1273 interesting++;
1273 interesting++;
1274 }
1274 }
1275 else if (sp != sv)
1275 else if (sp != sv)
1276 seen[p] |= sv;
1276 seen[p] |= sv;
1277 } else {
1277 } else {
1278 if (sp && sp < poison)
1278 if (sp && sp < poison)
1279 interesting--;
1279 interesting--;
1280 seen[p] = sv;
1280 seen[p] = sv;
1281 }
1281 }
1282 }
1282 }
1283 }
1283 }
1284
1284
1285 done:
1285 done:
1286 free(seen);
1286 free(seen);
1287 return gca;
1287 return gca;
1288 bail:
1288 bail:
1289 free(seen);
1289 free(seen);
1290 Py_XDECREF(gca);
1290 Py_XDECREF(gca);
1291 return NULL;
1291 return NULL;
1292 }
1292 }
1293
1293
1294 /*
1294 /*
1295 * Given a disjoint set of revs, return the subset with the longest
1295 * Given a disjoint set of revs, return the subset with the longest
1296 * path to the root.
1296 * path to the root.
1297 */
1297 */
1298 static PyObject *find_deepest(indexObject *self, PyObject *revs)
1298 static PyObject *find_deepest(indexObject *self, PyObject *revs)
1299 {
1299 {
1300 const Py_ssize_t revcount = PyList_GET_SIZE(revs);
1300 const Py_ssize_t revcount = PyList_GET_SIZE(revs);
1301 static const Py_ssize_t capacity = 24;
1301 static const Py_ssize_t capacity = 24;
1302 int *depth, *interesting = NULL;
1302 int *depth, *interesting = NULL;
1303 int i, j, v, ninteresting;
1303 int i, j, v, ninteresting;
1304 PyObject *dict = NULL, *keys;
1304 PyObject *dict = NULL, *keys;
1305 long *seen = NULL;
1305 long *seen = NULL;
1306 int maxrev = -1;
1306 int maxrev = -1;
1307 long final;
1307 long final;
1308
1308
1309 if (revcount > capacity) {
1309 if (revcount > capacity) {
1310 PyErr_Format(PyExc_OverflowError,
1310 PyErr_Format(PyExc_OverflowError,
1311 "bitset size (%ld) > capacity (%ld)",
1311 "bitset size (%ld) > capacity (%ld)",
1312 (long)revcount, (long)capacity);
1312 (long)revcount, (long)capacity);
1313 return NULL;
1313 return NULL;
1314 }
1314 }
1315
1315
1316 for (i = 0; i < revcount; i++) {
1316 for (i = 0; i < revcount; i++) {
1317 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1317 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1318 if (n > maxrev)
1318 if (n > maxrev)
1319 maxrev = n;
1319 maxrev = n;
1320 }
1320 }
1321
1321
1322 depth = calloc(sizeof(*depth), maxrev + 1);
1322 depth = calloc(sizeof(*depth), maxrev + 1);
1323 if (depth == NULL)
1323 if (depth == NULL)
1324 return PyErr_NoMemory();
1324 return PyErr_NoMemory();
1325
1325
1326 seen = calloc(sizeof(*seen), maxrev + 1);
1326 seen = calloc(sizeof(*seen), maxrev + 1);
1327 if (seen == NULL) {
1327 if (seen == NULL) {
1328 PyErr_NoMemory();
1328 PyErr_NoMemory();
1329 goto bail;
1329 goto bail;
1330 }
1330 }
1331
1331
1332 interesting = calloc(sizeof(*interesting), 2 << revcount);
1332 interesting = calloc(sizeof(*interesting), 2 << revcount);
1333 if (interesting == NULL) {
1333 if (interesting == NULL) {
1334 PyErr_NoMemory();
1334 PyErr_NoMemory();
1335 goto bail;
1335 goto bail;
1336 }
1336 }
1337
1337
1338 if (PyList_Sort(revs) == -1)
1338 if (PyList_Sort(revs) == -1)
1339 goto bail;
1339 goto bail;
1340
1340
1341 for (i = 0; i < revcount; i++) {
1341 for (i = 0; i < revcount; i++) {
1342 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1342 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1343 long b = 1l << i;
1343 long b = 1l << i;
1344 depth[n] = 1;
1344 depth[n] = 1;
1345 seen[n] = b;
1345 seen[n] = b;
1346 interesting[b] = 1;
1346 interesting[b] = 1;
1347 }
1347 }
1348
1348
1349 ninteresting = (int)revcount;
1349 ninteresting = (int)revcount;
1350
1350
1351 for (v = maxrev; v >= 0 && ninteresting > 1; v--) {
1351 for (v = maxrev; v >= 0 && ninteresting > 1; v--) {
1352 int dv = depth[v];
1352 int dv = depth[v];
1353 int parents[2];
1353 int parents[2];
1354 long sv;
1354 long sv;
1355
1355
1356 if (dv == 0)
1356 if (dv == 0)
1357 continue;
1357 continue;
1358
1358
1359 sv = seen[v];
1359 sv = seen[v];
1360 index_get_parents(self, v, parents);
1360 index_get_parents(self, v, parents);
1361
1361
1362 for (i = 0; i < 2; i++) {
1362 for (i = 0; i < 2; i++) {
1363 int p = parents[i];
1363 int p = parents[i];
1364 long nsp, sp;
1364 long nsp, sp;
1365 int dp;
1365 int dp;
1366
1366
1367 if (p == -1)
1367 if (p == -1)
1368 continue;
1368 continue;
1369
1369
1370 dp = depth[p];
1370 dp = depth[p];
1371 nsp = sp = seen[p];
1371 nsp = sp = seen[p];
1372 if (dp <= dv) {
1372 if (dp <= dv) {
1373 depth[p] = dv + 1;
1373 depth[p] = dv + 1;
1374 if (sp != sv) {
1374 if (sp != sv) {
1375 interesting[sv] += 1;
1375 interesting[sv] += 1;
1376 nsp = seen[p] = sv;
1376 nsp = seen[p] = sv;
1377 if (sp) {
1377 if (sp) {
1378 interesting[sp] -= 1;
1378 interesting[sp] -= 1;
1379 if (interesting[sp] == 0)
1379 if (interesting[sp] == 0)
1380 ninteresting -= 1;
1380 ninteresting -= 1;
1381 }
1381 }
1382 }
1382 }
1383 }
1383 }
1384 else if (dv == dp - 1) {
1384 else if (dv == dp - 1) {
1385 nsp = sp | sv;
1385 nsp = sp | sv;
1386 if (nsp == sp)
1386 if (nsp == sp)
1387 continue;
1387 continue;
1388 seen[p] = nsp;
1388 seen[p] = nsp;
1389 interesting[sp] -= 1;
1389 interesting[sp] -= 1;
1390 if (interesting[sp] == 0 && interesting[nsp] > 0)
1390 if (interesting[sp] == 0 && interesting[nsp] > 0)
1391 ninteresting -= 1;
1391 ninteresting -= 1;
1392 interesting[nsp] += 1;
1392 interesting[nsp] += 1;
1393 }
1393 }
1394 }
1394 }
1395 interesting[sv] -= 1;
1395 interesting[sv] -= 1;
1396 if (interesting[sv] == 0)
1396 if (interesting[sv] == 0)
1397 ninteresting -= 1;
1397 ninteresting -= 1;
1398 }
1398 }
1399
1399
1400 final = 0;
1400 final = 0;
1401 j = ninteresting;
1401 j = ninteresting;
1402 for (i = 0; i < (int)(2 << revcount) && j > 0; i++) {
1402 for (i = 0; i < (int)(2 << revcount) && j > 0; i++) {
1403 if (interesting[i] == 0)
1403 if (interesting[i] == 0)
1404 continue;
1404 continue;
1405 final |= i;
1405 final |= i;
1406 j -= 1;
1406 j -= 1;
1407 }
1407 }
1408 if (final == 0)
1408 if (final == 0)
1409 return PyList_New(0);
1409 return PyList_New(0);
1410
1410
1411 dict = PyDict_New();
1411 dict = PyDict_New();
1412 if (dict == NULL)
1412 if (dict == NULL)
1413 goto bail;
1413 goto bail;
1414
1414
1415 for (i = 0; i < revcount; i++) {
1415 for (i = 0; i < revcount; i++) {
1416 PyObject *key;
1416 PyObject *key;
1417
1417
1418 if ((final & (1 << i)) == 0)
1418 if ((final & (1 << i)) == 0)
1419 continue;
1419 continue;
1420
1420
1421 key = PyList_GET_ITEM(revs, i);
1421 key = PyList_GET_ITEM(revs, i);
1422 Py_INCREF(key);
1422 Py_INCREF(key);
1423 Py_INCREF(Py_None);
1423 Py_INCREF(Py_None);
1424 if (PyDict_SetItem(dict, key, Py_None) == -1) {
1424 if (PyDict_SetItem(dict, key, Py_None) == -1) {
1425 Py_DECREF(key);
1425 Py_DECREF(key);
1426 Py_DECREF(Py_None);
1426 Py_DECREF(Py_None);
1427 goto bail;
1427 goto bail;
1428 }
1428 }
1429 }
1429 }
1430
1430
1431 keys = PyDict_Keys(dict);
1431 keys = PyDict_Keys(dict);
1432
1432
1433 free(depth);
1433 free(depth);
1434 free(seen);
1434 free(seen);
1435 free(interesting);
1435 free(interesting);
1436 Py_DECREF(dict);
1436 Py_DECREF(dict);
1437
1437
1438 return keys;
1438 return keys;
1439 bail:
1439 bail:
1440 free(depth);
1440 free(depth);
1441 free(seen);
1441 free(seen);
1442 free(interesting);
1442 free(interesting);
1443 Py_XDECREF(dict);
1443 Py_XDECREF(dict);
1444
1444
1445 return NULL;
1445 return NULL;
1446 }
1446 }
1447
1447
1448 /*
1448 /*
1449 * Given a (possibly overlapping) set of revs, return the greatest
1449 * Given a (possibly overlapping) set of revs, return the greatest
1450 * common ancestors: those with the longest path to the root.
1450 * common ancestors: those with the longest path to the root.
1451 */
1451 */
1452 static PyObject *index_ancestors(indexObject *self, PyObject *args)
1452 static PyObject *index_ancestors(indexObject *self, PyObject *args)
1453 {
1453 {
1454 PyObject *ret = NULL, *gca = NULL;
1454 PyObject *ret = NULL, *gca = NULL;
1455 Py_ssize_t argcount, i, len;
1455 Py_ssize_t argcount, i, len;
1456 bitmask repeat = 0;
1456 bitmask repeat = 0;
1457 int revcount = 0;
1457 int revcount = 0;
1458 int *revs;
1458 int *revs;
1459
1459
1460 argcount = PySequence_Length(args);
1460 argcount = PySequence_Length(args);
1461 revs = malloc(argcount * sizeof(*revs));
1461 revs = malloc(argcount * sizeof(*revs));
1462 if (argcount > 0 && revs == NULL)
1462 if (argcount > 0 && revs == NULL)
1463 return PyErr_NoMemory();
1463 return PyErr_NoMemory();
1464 len = index_length(self) - 1;
1464 len = index_length(self) - 1;
1465
1465
1466 for (i = 0; i < argcount; i++) {
1466 for (i = 0; i < argcount; i++) {
1467 static const int capacity = 24;
1467 static const int capacity = 24;
1468 PyObject *obj = PySequence_GetItem(args, i);
1468 PyObject *obj = PySequence_GetItem(args, i);
1469 bitmask x;
1469 bitmask x;
1470 long val;
1470 long val;
1471
1471
1472 if (!PyInt_Check(obj)) {
1472 if (!PyInt_Check(obj)) {
1473 PyErr_SetString(PyExc_TypeError,
1473 PyErr_SetString(PyExc_TypeError,
1474 "arguments must all be ints");
1474 "arguments must all be ints");
1475 goto bail;
1475 goto bail;
1476 }
1476 }
1477 val = PyInt_AsLong(obj);
1477 val = PyInt_AsLong(obj);
1478 if (val == -1) {
1478 if (val == -1) {
1479 ret = PyList_New(0);
1479 ret = PyList_New(0);
1480 goto done;
1480 goto done;
1481 }
1481 }
1482 if (val < 0 || val >= len) {
1482 if (val < 0 || val >= len) {
1483 PyErr_SetString(PyExc_IndexError,
1483 PyErr_SetString(PyExc_IndexError,
1484 "index out of range");
1484 "index out of range");
1485 goto bail;
1485 goto bail;
1486 }
1486 }
1487 /* this cheesy bloom filter lets us avoid some more
1487 /* this cheesy bloom filter lets us avoid some more
1488 * expensive duplicate checks in the common set-is-disjoint
1488 * expensive duplicate checks in the common set-is-disjoint
1489 * case */
1489 * case */
1490 x = 1ull << (val & 0x3f);
1490 x = 1ull << (val & 0x3f);
1491 if (repeat & x) {
1491 if (repeat & x) {
1492 int k;
1492 int k;
1493 for (k = 0; k < revcount; k++) {
1493 for (k = 0; k < revcount; k++) {
1494 if (val == revs[k])
1494 if (val == revs[k])
1495 goto duplicate;
1495 goto duplicate;
1496 }
1496 }
1497 }
1497 }
1498 else repeat |= x;
1498 else repeat |= x;
1499 if (revcount >= capacity) {
1499 if (revcount >= capacity) {
1500 PyErr_Format(PyExc_OverflowError,
1500 PyErr_Format(PyExc_OverflowError,
1501 "bitset size (%d) > capacity (%d)",
1501 "bitset size (%d) > capacity (%d)",
1502 revcount, capacity);
1502 revcount, capacity);
1503 goto bail;
1503 goto bail;
1504 }
1504 }
1505 revs[revcount++] = (int)val;
1505 revs[revcount++] = (int)val;
1506 duplicate:;
1506 duplicate:;
1507 }
1507 }
1508
1508
1509 if (revcount == 0) {
1509 if (revcount == 0) {
1510 ret = PyList_New(0);
1510 ret = PyList_New(0);
1511 goto done;
1511 goto done;
1512 }
1512 }
1513 if (revcount == 1) {
1513 if (revcount == 1) {
1514 PyObject *obj;
1514 PyObject *obj;
1515 ret = PyList_New(1);
1515 ret = PyList_New(1);
1516 if (ret == NULL)
1516 if (ret == NULL)
1517 goto bail;
1517 goto bail;
1518 obj = PyInt_FromLong(revs[0]);
1518 obj = PyInt_FromLong(revs[0]);
1519 if (obj == NULL)
1519 if (obj == NULL)
1520 goto bail;
1520 goto bail;
1521 PyList_SET_ITEM(ret, 0, obj);
1521 PyList_SET_ITEM(ret, 0, obj);
1522 goto done;
1522 goto done;
1523 }
1523 }
1524
1524
1525 gca = find_gca_candidates(self, revs, revcount);
1525 gca = find_gca_candidates(self, revs, revcount);
1526 if (gca == NULL)
1526 if (gca == NULL)
1527 goto bail;
1527 goto bail;
1528
1528
1529 if (PyList_GET_SIZE(gca) <= 1) {
1529 if (PyList_GET_SIZE(gca) <= 1) {
1530 ret = gca;
1530 ret = gca;
1531 Py_INCREF(gca);
1531 Py_INCREF(gca);
1532 }
1532 }
1533 else if (PyList_GET_SIZE(gca) == 1) {
1533 else if (PyList_GET_SIZE(gca) == 1) {
1534 ret = PyList_GET_ITEM(gca, 0);
1534 ret = PyList_GET_ITEM(gca, 0);
1535 Py_INCREF(ret);
1535 Py_INCREF(ret);
1536 }
1536 }
1537 else ret = find_deepest(self, gca);
1537 else ret = find_deepest(self, gca);
1538
1538
1539 done:
1539 done:
1540 free(revs);
1540 free(revs);
1541 Py_XDECREF(gca);
1541 Py_XDECREF(gca);
1542
1542
1543 return ret;
1543 return ret;
1544
1544
1545 bail:
1545 bail:
1546 free(revs);
1546 free(revs);
1547 Py_XDECREF(gca);
1547 Py_XDECREF(gca);
1548 Py_XDECREF(ret);
1548 Py_XDECREF(ret);
1549 return NULL;
1549 return NULL;
1550 }
1550 }
1551
1551
1552 /*
1552 /*
1553 * Invalidate any trie entries introduced by added revs.
1553 * Invalidate any trie entries introduced by added revs.
1554 */
1554 */
1555 static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
1555 static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
1556 {
1556 {
1557 Py_ssize_t i, len = PyList_GET_SIZE(self->added);
1557 Py_ssize_t i, len = PyList_GET_SIZE(self->added);
1558
1558
1559 for (i = start; i < len; i++) {
1559 for (i = start; i < len; i++) {
1560 PyObject *tuple = PyList_GET_ITEM(self->added, i);
1560 PyObject *tuple = PyList_GET_ITEM(self->added, i);
1561 PyObject *node = PyTuple_GET_ITEM(tuple, 7);
1561 PyObject *node = PyTuple_GET_ITEM(tuple, 7);
1562
1562
1563 nt_insert(self, PyString_AS_STRING(node), -1);
1563 nt_insert(self, PyString_AS_STRING(node), -1);
1564 }
1564 }
1565
1565
1566 if (start == 0)
1566 if (start == 0)
1567 Py_CLEAR(self->added);
1567 Py_CLEAR(self->added);
1568 }
1568 }
1569
1569
1570 /*
1570 /*
1571 * Delete a numeric range of revs, which must be at the end of the
1571 * Delete a numeric range of revs, which must be at the end of the
1572 * range, but exclude the sentinel nullid entry.
1572 * range, but exclude the sentinel nullid entry.
1573 */
1573 */
1574 static int index_slice_del(indexObject *self, PyObject *item)
1574 static int index_slice_del(indexObject *self, PyObject *item)
1575 {
1575 {
1576 Py_ssize_t start, stop, step, slicelength;
1576 Py_ssize_t start, stop, step, slicelength;
1577 Py_ssize_t length = index_length(self);
1577 Py_ssize_t length = index_length(self);
1578 int ret = 0;
1578 int ret = 0;
1579
1579
1580 if (PySlice_GetIndicesEx((PySliceObject*)item, length,
1580 if (PySlice_GetIndicesEx((PySliceObject*)item, length,
1581 &start, &stop, &step, &slicelength) < 0)
1581 &start, &stop, &step, &slicelength) < 0)
1582 return -1;
1582 return -1;
1583
1583
1584 if (slicelength <= 0)
1584 if (slicelength <= 0)
1585 return 0;
1585 return 0;
1586
1586
1587 if ((step < 0 && start < stop) || (step > 0 && start > stop))
1587 if ((step < 0 && start < stop) || (step > 0 && start > stop))
1588 stop = start;
1588 stop = start;
1589
1589
1590 if (step < 0) {
1590 if (step < 0) {
1591 stop = start + 1;
1591 stop = start + 1;
1592 start = stop + step*(slicelength - 1) - 1;
1592 start = stop + step*(slicelength - 1) - 1;
1593 step = -step;
1593 step = -step;
1594 }
1594 }
1595
1595
1596 if (step != 1) {
1596 if (step != 1) {
1597 PyErr_SetString(PyExc_ValueError,
1597 PyErr_SetString(PyExc_ValueError,
1598 "revlog index delete requires step size of 1");
1598 "revlog index delete requires step size of 1");
1599 return -1;
1599 return -1;
1600 }
1600 }
1601
1601
1602 if (stop != length - 1) {
1602 if (stop != length - 1) {
1603 PyErr_SetString(PyExc_IndexError,
1603 PyErr_SetString(PyExc_IndexError,
1604 "revlog index deletion indices are invalid");
1604 "revlog index deletion indices are invalid");
1605 return -1;
1605 return -1;
1606 }
1606 }
1607
1607
1608 if (start < self->length - 1) {
1608 if (start < self->length - 1) {
1609 if (self->nt) {
1609 if (self->nt) {
1610 Py_ssize_t i;
1610 Py_ssize_t i;
1611
1611
1612 for (i = start + 1; i < self->length - 1; i++) {
1612 for (i = start + 1; i < self->length - 1; i++) {
1613 const char *node = index_node(self, i);
1613 const char *node = index_node(self, i);
1614
1614
1615 if (node)
1615 if (node)
1616 nt_insert(self, node, -1);
1616 nt_insert(self, node, -1);
1617 }
1617 }
1618 if (self->added)
1618 if (self->added)
1619 nt_invalidate_added(self, 0);
1619 nt_invalidate_added(self, 0);
1620 if (self->ntrev > start)
1620 if (self->ntrev > start)
1621 self->ntrev = (int)start;
1621 self->ntrev = (int)start;
1622 }
1622 }
1623 self->length = start + 1;
1623 self->length = start + 1;
1624 if (start < self->raw_length) {
1624 if (start < self->raw_length) {
1625 if (self->cache) {
1625 if (self->cache) {
1626 Py_ssize_t i;
1626 Py_ssize_t i;
1627 for (i = start; i < self->raw_length; i++)
1627 for (i = start; i < self->raw_length; i++)
1628 Py_CLEAR(self->cache[i]);
1628 Py_CLEAR(self->cache[i]);
1629 }
1629 }
1630 self->raw_length = start;
1630 self->raw_length = start;
1631 }
1631 }
1632 goto done;
1632 goto done;
1633 }
1633 }
1634
1634
1635 if (self->nt) {
1635 if (self->nt) {
1636 nt_invalidate_added(self, start - self->length + 1);
1636 nt_invalidate_added(self, start - self->length + 1);
1637 if (self->ntrev > start)
1637 if (self->ntrev > start)
1638 self->ntrev = (int)start;
1638 self->ntrev = (int)start;
1639 }
1639 }
1640 if (self->added)
1640 if (self->added)
1641 ret = PyList_SetSlice(self->added, start - self->length + 1,
1641 ret = PyList_SetSlice(self->added, start - self->length + 1,
1642 PyList_GET_SIZE(self->added), NULL);
1642 PyList_GET_SIZE(self->added), NULL);
1643 done:
1643 done:
1644 Py_CLEAR(self->headrevs);
1644 Py_CLEAR(self->headrevs);
1645 return ret;
1645 return ret;
1646 }
1646 }
1647
1647
1648 /*
1648 /*
1649 * Supported ops:
1649 * Supported ops:
1650 *
1650 *
1651 * slice deletion
1651 * slice deletion
1652 * string assignment (extend node->rev mapping)
1652 * string assignment (extend node->rev mapping)
1653 * string deletion (shrink node->rev mapping)
1653 * string deletion (shrink node->rev mapping)
1654 */
1654 */
1655 static int index_assign_subscript(indexObject *self, PyObject *item,
1655 static int index_assign_subscript(indexObject *self, PyObject *item,
1656 PyObject *value)
1656 PyObject *value)
1657 {
1657 {
1658 char *node;
1658 char *node;
1659 Py_ssize_t nodelen;
1659 Py_ssize_t nodelen;
1660 long rev;
1660 long rev;
1661
1661
1662 if (PySlice_Check(item) && value == NULL)
1662 if (PySlice_Check(item) && value == NULL)
1663 return index_slice_del(self, item);
1663 return index_slice_del(self, item);
1664
1664
1665 if (node_check(item, &node, &nodelen) == -1)
1665 if (node_check(item, &node, &nodelen) == -1)
1666 return -1;
1666 return -1;
1667
1667
1668 if (value == NULL)
1668 if (value == NULL)
1669 return self->nt ? nt_insert(self, node, -1) : 0;
1669 return self->nt ? nt_insert(self, node, -1) : 0;
1670 rev = PyInt_AsLong(value);
1670 rev = PyInt_AsLong(value);
1671 if (rev > INT_MAX || rev < 0) {
1671 if (rev > INT_MAX || rev < 0) {
1672 if (!PyErr_Occurred())
1672 if (!PyErr_Occurred())
1673 PyErr_SetString(PyExc_ValueError, "rev out of range");
1673 PyErr_SetString(PyExc_ValueError, "rev out of range");
1674 return -1;
1674 return -1;
1675 }
1675 }
1676 return nt_insert(self, node, (int)rev);
1676 return nt_insert(self, node, (int)rev);
1677 }
1677 }
1678
1678
1679 /*
1679 /*
1680 * Find all RevlogNG entries in an index that has inline data. Update
1680 * Find all RevlogNG entries in an index that has inline data. Update
1681 * the optional "offsets" table with those entries.
1681 * the optional "offsets" table with those entries.
1682 */
1682 */
1683 static long inline_scan(indexObject *self, const char **offsets)
1683 static long inline_scan(indexObject *self, const char **offsets)
1684 {
1684 {
1685 const char *data = PyString_AS_STRING(self->data);
1685 const char *data = PyString_AS_STRING(self->data);
1686 const char *end = data + PyString_GET_SIZE(self->data);
1686 const char *end = data + PyString_GET_SIZE(self->data);
1687 long incr = v1_hdrsize;
1687 long incr = v1_hdrsize;
1688 Py_ssize_t len = 0;
1688 Py_ssize_t len = 0;
1689
1689
1690 while (data + v1_hdrsize <= end) {
1690 while (data + v1_hdrsize <= end) {
1691 uint32_t comp_len;
1691 uint32_t comp_len;
1692 const char *old_data;
1692 const char *old_data;
1693 /* 3rd element of header is length of compressed inline data */
1693 /* 3rd element of header is length of compressed inline data */
1694 comp_len = getbe32(data + 8);
1694 comp_len = getbe32(data + 8);
1695 incr = v1_hdrsize + comp_len;
1695 incr = v1_hdrsize + comp_len;
1696 if (incr < v1_hdrsize)
1696 if (incr < v1_hdrsize)
1697 break;
1697 break;
1698 if (offsets)
1698 if (offsets)
1699 offsets[len] = data;
1699 offsets[len] = data;
1700 len++;
1700 len++;
1701 old_data = data;
1701 old_data = data;
1702 data += incr;
1702 data += incr;
1703 if (data <= old_data)
1703 if (data <= old_data)
1704 break;
1704 break;
1705 }
1705 }
1706
1706
1707 if (data != end && data + v1_hdrsize != end) {
1707 if (data != end && data + v1_hdrsize != end) {
1708 if (!PyErr_Occurred())
1708 if (!PyErr_Occurred())
1709 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1709 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1710 return -1;
1710 return -1;
1711 }
1711 }
1712
1712
1713 return len;
1713 return len;
1714 }
1714 }
1715
1715
1716 static int index_init(indexObject *self, PyObject *args)
1716 static int index_init(indexObject *self, PyObject *args)
1717 {
1717 {
1718 PyObject *data_obj, *inlined_obj;
1718 PyObject *data_obj, *inlined_obj;
1719 Py_ssize_t size;
1719 Py_ssize_t size;
1720
1720
1721 /* Initialize before argument-checking to avoid index_dealloc() crash. */
1722 self->raw_length = 0;
1723 self->added = NULL;
1724 self->cache = NULL;
1725 self->data = NULL;
1726 self->headrevs = NULL;
1727 self->nt = NULL;
1728 self->offsets = NULL;
1729
1721 if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
1730 if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
1722 return -1;
1731 return -1;
1723 if (!PyString_Check(data_obj)) {
1732 if (!PyString_Check(data_obj)) {
1724 PyErr_SetString(PyExc_TypeError, "data is not a string");
1733 PyErr_SetString(PyExc_TypeError, "data is not a string");
1725 return -1;
1734 return -1;
1726 }
1735 }
1727 size = PyString_GET_SIZE(data_obj);
1736 size = PyString_GET_SIZE(data_obj);
1728
1737
1729 self->inlined = inlined_obj && PyObject_IsTrue(inlined_obj);
1738 self->inlined = inlined_obj && PyObject_IsTrue(inlined_obj);
1730 self->data = data_obj;
1739 self->data = data_obj;
1731 self->cache = NULL;
1732
1740
1733 self->added = NULL;
1734 self->headrevs = NULL;
1735 self->offsets = NULL;
1736 self->nt = NULL;
1737 self->ntlength = self->ntcapacity = 0;
1741 self->ntlength = self->ntcapacity = 0;
1738 self->ntdepth = self->ntsplits = 0;
1742 self->ntdepth = self->ntsplits = 0;
1739 self->ntlookups = self->ntmisses = 0;
1743 self->ntlookups = self->ntmisses = 0;
1740 self->ntrev = -1;
1744 self->ntrev = -1;
1741 Py_INCREF(self->data);
1745 Py_INCREF(self->data);
1742
1746
1743 if (self->inlined) {
1747 if (self->inlined) {
1744 long len = inline_scan(self, NULL);
1748 long len = inline_scan(self, NULL);
1745 if (len == -1)
1749 if (len == -1)
1746 goto bail;
1750 goto bail;
1747 self->raw_length = len;
1751 self->raw_length = len;
1748 self->length = len + 1;
1752 self->length = len + 1;
1749 } else {
1753 } else {
1750 if (size % v1_hdrsize) {
1754 if (size % v1_hdrsize) {
1751 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1755 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1752 goto bail;
1756 goto bail;
1753 }
1757 }
1754 self->raw_length = size / v1_hdrsize;
1758 self->raw_length = size / v1_hdrsize;
1755 self->length = self->raw_length + 1;
1759 self->length = self->raw_length + 1;
1756 }
1760 }
1757
1761
1758 return 0;
1762 return 0;
1759 bail:
1763 bail:
1760 return -1;
1764 return -1;
1761 }
1765 }
1762
1766
1763 static PyObject *index_nodemap(indexObject *self)
1767 static PyObject *index_nodemap(indexObject *self)
1764 {
1768 {
1765 Py_INCREF(self);
1769 Py_INCREF(self);
1766 return (PyObject *)self;
1770 return (PyObject *)self;
1767 }
1771 }
1768
1772
1769 static void index_dealloc(indexObject *self)
1773 static void index_dealloc(indexObject *self)
1770 {
1774 {
1771 _index_clearcaches(self);
1775 _index_clearcaches(self);
1772 Py_DECREF(self->data);
1776 Py_XDECREF(self->data);
1773 Py_XDECREF(self->added);
1777 Py_XDECREF(self->added);
1774 PyObject_Del(self);
1778 PyObject_Del(self);
1775 }
1779 }
1776
1780
1777 static PySequenceMethods index_sequence_methods = {
1781 static PySequenceMethods index_sequence_methods = {
1778 (lenfunc)index_length, /* sq_length */
1782 (lenfunc)index_length, /* sq_length */
1779 0, /* sq_concat */
1783 0, /* sq_concat */
1780 0, /* sq_repeat */
1784 0, /* sq_repeat */
1781 (ssizeargfunc)index_get, /* sq_item */
1785 (ssizeargfunc)index_get, /* sq_item */
1782 0, /* sq_slice */
1786 0, /* sq_slice */
1783 0, /* sq_ass_item */
1787 0, /* sq_ass_item */
1784 0, /* sq_ass_slice */
1788 0, /* sq_ass_slice */
1785 (objobjproc)index_contains, /* sq_contains */
1789 (objobjproc)index_contains, /* sq_contains */
1786 };
1790 };
1787
1791
1788 static PyMappingMethods index_mapping_methods = {
1792 static PyMappingMethods index_mapping_methods = {
1789 (lenfunc)index_length, /* mp_length */
1793 (lenfunc)index_length, /* mp_length */
1790 (binaryfunc)index_getitem, /* mp_subscript */
1794 (binaryfunc)index_getitem, /* mp_subscript */
1791 (objobjargproc)index_assign_subscript, /* mp_ass_subscript */
1795 (objobjargproc)index_assign_subscript, /* mp_ass_subscript */
1792 };
1796 };
1793
1797
1794 static PyMethodDef index_methods[] = {
1798 static PyMethodDef index_methods[] = {
1795 {"ancestors", (PyCFunction)index_ancestors, METH_VARARGS,
1799 {"ancestors", (PyCFunction)index_ancestors, METH_VARARGS,
1796 "return the gca set of the given revs"},
1800 "return the gca set of the given revs"},
1797 {"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
1801 {"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
1798 "clear the index caches"},
1802 "clear the index caches"},
1799 {"get", (PyCFunction)index_m_get, METH_VARARGS,
1803 {"get", (PyCFunction)index_m_get, METH_VARARGS,
1800 "get an index entry"},
1804 "get an index entry"},
1801 {"headrevs", (PyCFunction)index_headrevs, METH_NOARGS,
1805 {"headrevs", (PyCFunction)index_headrevs, METH_NOARGS,
1802 "get head revisions"},
1806 "get head revisions"},
1803 {"insert", (PyCFunction)index_insert, METH_VARARGS,
1807 {"insert", (PyCFunction)index_insert, METH_VARARGS,
1804 "insert an index entry"},
1808 "insert an index entry"},
1805 {"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
1809 {"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
1806 "match a potentially ambiguous node ID"},
1810 "match a potentially ambiguous node ID"},
1807 {"stats", (PyCFunction)index_stats, METH_NOARGS,
1811 {"stats", (PyCFunction)index_stats, METH_NOARGS,
1808 "stats for the index"},
1812 "stats for the index"},
1809 {NULL} /* Sentinel */
1813 {NULL} /* Sentinel */
1810 };
1814 };
1811
1815
1812 static PyGetSetDef index_getset[] = {
1816 static PyGetSetDef index_getset[] = {
1813 {"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
1817 {"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
1814 {NULL} /* Sentinel */
1818 {NULL} /* Sentinel */
1815 };
1819 };
1816
1820
1817 static PyTypeObject indexType = {
1821 static PyTypeObject indexType = {
1818 PyObject_HEAD_INIT(NULL)
1822 PyObject_HEAD_INIT(NULL)
1819 0, /* ob_size */
1823 0, /* ob_size */
1820 "parsers.index", /* tp_name */
1824 "parsers.index", /* tp_name */
1821 sizeof(indexObject), /* tp_basicsize */
1825 sizeof(indexObject), /* tp_basicsize */
1822 0, /* tp_itemsize */
1826 0, /* tp_itemsize */
1823 (destructor)index_dealloc, /* tp_dealloc */
1827 (destructor)index_dealloc, /* tp_dealloc */
1824 0, /* tp_print */
1828 0, /* tp_print */
1825 0, /* tp_getattr */
1829 0, /* tp_getattr */
1826 0, /* tp_setattr */
1830 0, /* tp_setattr */
1827 0, /* tp_compare */
1831 0, /* tp_compare */
1828 0, /* tp_repr */
1832 0, /* tp_repr */
1829 0, /* tp_as_number */
1833 0, /* tp_as_number */
1830 &index_sequence_methods, /* tp_as_sequence */
1834 &index_sequence_methods, /* tp_as_sequence */
1831 &index_mapping_methods, /* tp_as_mapping */
1835 &index_mapping_methods, /* tp_as_mapping */
1832 0, /* tp_hash */
1836 0, /* tp_hash */
1833 0, /* tp_call */
1837 0, /* tp_call */
1834 0, /* tp_str */
1838 0, /* tp_str */
1835 0, /* tp_getattro */
1839 0, /* tp_getattro */
1836 0, /* tp_setattro */
1840 0, /* tp_setattro */
1837 0, /* tp_as_buffer */
1841 0, /* tp_as_buffer */
1838 Py_TPFLAGS_DEFAULT, /* tp_flags */
1842 Py_TPFLAGS_DEFAULT, /* tp_flags */
1839 "revlog index", /* tp_doc */
1843 "revlog index", /* tp_doc */
1840 0, /* tp_traverse */
1844 0, /* tp_traverse */
1841 0, /* tp_clear */
1845 0, /* tp_clear */
1842 0, /* tp_richcompare */
1846 0, /* tp_richcompare */
1843 0, /* tp_weaklistoffset */
1847 0, /* tp_weaklistoffset */
1844 0, /* tp_iter */
1848 0, /* tp_iter */
1845 0, /* tp_iternext */
1849 0, /* tp_iternext */
1846 index_methods, /* tp_methods */
1850 index_methods, /* tp_methods */
1847 0, /* tp_members */
1851 0, /* tp_members */
1848 index_getset, /* tp_getset */
1852 index_getset, /* tp_getset */
1849 0, /* tp_base */
1853 0, /* tp_base */
1850 0, /* tp_dict */
1854 0, /* tp_dict */
1851 0, /* tp_descr_get */
1855 0, /* tp_descr_get */
1852 0, /* tp_descr_set */
1856 0, /* tp_descr_set */
1853 0, /* tp_dictoffset */
1857 0, /* tp_dictoffset */
1854 (initproc)index_init, /* tp_init */
1858 (initproc)index_init, /* tp_init */
1855 0, /* tp_alloc */
1859 0, /* tp_alloc */
1856 };
1860 };
1857
1861
1858 /*
1862 /*
1859 * returns a tuple of the form (index, index, cache) with elements as
1863 * returns a tuple of the form (index, index, cache) with elements as
1860 * follows:
1864 * follows:
1861 *
1865 *
1862 * index: an index object that lazily parses RevlogNG records
1866 * index: an index object that lazily parses RevlogNG records
1863 * cache: if data is inlined, a tuple (index_file_content, 0), else None
1867 * cache: if data is inlined, a tuple (index_file_content, 0), else None
1864 *
1868 *
1865 * added complications are for backwards compatibility
1869 * added complications are for backwards compatibility
1866 */
1870 */
1867 static PyObject *parse_index2(PyObject *self, PyObject *args)
1871 static PyObject *parse_index2(PyObject *self, PyObject *args)
1868 {
1872 {
1869 PyObject *tuple = NULL, *cache = NULL;
1873 PyObject *tuple = NULL, *cache = NULL;
1870 indexObject *idx;
1874 indexObject *idx;
1871 int ret;
1875 int ret;
1872
1876
1873 idx = PyObject_New(indexObject, &indexType);
1877 idx = PyObject_New(indexObject, &indexType);
1874 if (idx == NULL)
1878 if (idx == NULL)
1875 goto bail;
1879 goto bail;
1876
1880
1877 ret = index_init(idx, args);
1881 ret = index_init(idx, args);
1878 if (ret == -1)
1882 if (ret == -1)
1879 goto bail;
1883 goto bail;
1880
1884
1881 if (idx->inlined) {
1885 if (idx->inlined) {
1882 cache = Py_BuildValue("iO", 0, idx->data);
1886 cache = Py_BuildValue("iO", 0, idx->data);
1883 if (cache == NULL)
1887 if (cache == NULL)
1884 goto bail;
1888 goto bail;
1885 } else {
1889 } else {
1886 cache = Py_None;
1890 cache = Py_None;
1887 Py_INCREF(cache);
1891 Py_INCREF(cache);
1888 }
1892 }
1889
1893
1890 tuple = Py_BuildValue("NN", idx, cache);
1894 tuple = Py_BuildValue("NN", idx, cache);
1891 if (!tuple)
1895 if (!tuple)
1892 goto bail;
1896 goto bail;
1893 return tuple;
1897 return tuple;
1894
1898
1895 bail:
1899 bail:
1896 Py_XDECREF(idx);
1900 Py_XDECREF(idx);
1897 Py_XDECREF(cache);
1901 Py_XDECREF(cache);
1898 Py_XDECREF(tuple);
1902 Py_XDECREF(tuple);
1899 return NULL;
1903 return NULL;
1900 }
1904 }
1901
1905
1902 static char parsers_doc[] = "Efficient content parsing.";
1906 static char parsers_doc[] = "Efficient content parsing.";
1903
1907
1904 PyObject *encodedir(PyObject *self, PyObject *args);
1908 PyObject *encodedir(PyObject *self, PyObject *args);
1905 PyObject *pathencode(PyObject *self, PyObject *args);
1909 PyObject *pathencode(PyObject *self, PyObject *args);
1906 PyObject *lowerencode(PyObject *self, PyObject *args);
1910 PyObject *lowerencode(PyObject *self, PyObject *args);
1907
1911
1908 static PyMethodDef methods[] = {
1912 static PyMethodDef methods[] = {
1909 {"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
1913 {"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
1910 {"parse_manifest", parse_manifest, METH_VARARGS, "parse a manifest\n"},
1914 {"parse_manifest", parse_manifest, METH_VARARGS, "parse a manifest\n"},
1911 {"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
1915 {"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
1912 {"parse_index2", parse_index2, METH_VARARGS, "parse a revlog index\n"},
1916 {"parse_index2", parse_index2, METH_VARARGS, "parse a revlog index\n"},
1913 {"encodedir", encodedir, METH_VARARGS, "encodedir a path\n"},
1917 {"encodedir", encodedir, METH_VARARGS, "encodedir a path\n"},
1914 {"pathencode", pathencode, METH_VARARGS, "fncache-encode a path\n"},
1918 {"pathencode", pathencode, METH_VARARGS, "fncache-encode a path\n"},
1915 {"lowerencode", lowerencode, METH_VARARGS, "lower-encode a path\n"},
1919 {"lowerencode", lowerencode, METH_VARARGS, "lower-encode a path\n"},
1916 {NULL, NULL}
1920 {NULL, NULL}
1917 };
1921 };
1918
1922
1919 void dirs_module_init(PyObject *mod);
1923 void dirs_module_init(PyObject *mod);
1920
1924
1921 static void module_init(PyObject *mod)
1925 static void module_init(PyObject *mod)
1922 {
1926 {
1923 dirs_module_init(mod);
1927 dirs_module_init(mod);
1924
1928
1925 indexType.tp_new = PyType_GenericNew;
1929 indexType.tp_new = PyType_GenericNew;
1926 if (PyType_Ready(&indexType) < 0)
1930 if (PyType_Ready(&indexType) < 0)
1927 return;
1931 return;
1928 Py_INCREF(&indexType);
1932 Py_INCREF(&indexType);
1929
1933
1930 PyModule_AddObject(mod, "index", (PyObject *)&indexType);
1934 PyModule_AddObject(mod, "index", (PyObject *)&indexType);
1931
1935
1932 nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
1936 nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
1933 -1, -1, -1, -1, nullid, 20);
1937 -1, -1, -1, -1, nullid, 20);
1934 if (nullentry)
1938 if (nullentry)
1935 PyObject_GC_UnTrack(nullentry);
1939 PyObject_GC_UnTrack(nullentry);
1936
1940
1937 dirstate_unset = Py_BuildValue("ciii", 'n', 0, -1, -1);
1941 dirstate_unset = Py_BuildValue("ciii", 'n', 0, -1, -1);
1938 }
1942 }
1939
1943
1940 #ifdef IS_PY3K
1944 #ifdef IS_PY3K
1941 static struct PyModuleDef parsers_module = {
1945 static struct PyModuleDef parsers_module = {
1942 PyModuleDef_HEAD_INIT,
1946 PyModuleDef_HEAD_INIT,
1943 "parsers",
1947 "parsers",
1944 parsers_doc,
1948 parsers_doc,
1945 -1,
1949 -1,
1946 methods
1950 methods
1947 };
1951 };
1948
1952
1949 PyMODINIT_FUNC PyInit_parsers(void)
1953 PyMODINIT_FUNC PyInit_parsers(void)
1950 {
1954 {
1951 PyObject *mod = PyModule_Create(&parsers_module);
1955 PyObject *mod = PyModule_Create(&parsers_module);
1952 module_init(mod);
1956 module_init(mod);
1953 return mod;
1957 return mod;
1954 }
1958 }
1955 #else
1959 #else
1956 PyMODINIT_FUNC initparsers(void)
1960 PyMODINIT_FUNC initparsers(void)
1957 {
1961 {
1958 PyObject *mod = Py_InitModule3("parsers", methods, parsers_doc);
1962 PyObject *mod = Py_InitModule3("parsers", methods, parsers_doc);
1959 module_init(mod);
1963 module_init(mod);
1960 }
1964 }
1961 #endif
1965 #endif
@@ -1,126 +1,134
1 from mercurial import parsers
1 from mercurial import parsers
2 from mercurial.node import nullid, nullrev
2 from mercurial.node import nullid, nullrev
3 import struct
3 import struct
4
4
5 # This unit test compares the return value of the original Python
5 # This unit test compares the return value of the original Python
6 # implementation of parseindex and the new C implementation for
6 # implementation of parseindex and the new C implementation for
7 # an index file with and without inlined data
7 # an index file with and without inlined data
8
8
9 # original python implementation
9 # original python implementation
10 def gettype(q):
10 def gettype(q):
11 return int(q & 0xFFFF)
11 return int(q & 0xFFFF)
12
12
13 def offset_type(offset, type):
13 def offset_type(offset, type):
14 return long(long(offset) << 16 | type)
14 return long(long(offset) << 16 | type)
15
15
16 indexformatng = ">Qiiiiii20s12x"
16 indexformatng = ">Qiiiiii20s12x"
17
17
18 def py_parseindex(data, inline) :
18 def py_parseindex(data, inline) :
19 s = 64
19 s = 64
20 cache = None
20 cache = None
21 index = []
21 index = []
22 nodemap = {nullid: nullrev}
22 nodemap = {nullid: nullrev}
23 n = off = 0
23 n = off = 0
24
24
25 l = len(data) - s
25 l = len(data) - s
26 append = index.append
26 append = index.append
27 if inline:
27 if inline:
28 cache = (0, data)
28 cache = (0, data)
29 while off <= l:
29 while off <= l:
30 e = struct.unpack(indexformatng, data[off:off + s])
30 e = struct.unpack(indexformatng, data[off:off + s])
31 nodemap[e[7]] = n
31 nodemap[e[7]] = n
32 append(e)
32 append(e)
33 n += 1
33 n += 1
34 if e[1] < 0:
34 if e[1] < 0:
35 break
35 break
36 off += e[1] + s
36 off += e[1] + s
37 else:
37 else:
38 while off <= l:
38 while off <= l:
39 e = struct.unpack(indexformatng, data[off:off + s])
39 e = struct.unpack(indexformatng, data[off:off + s])
40 nodemap[e[7]] = n
40 nodemap[e[7]] = n
41 append(e)
41 append(e)
42 n += 1
42 n += 1
43 off += s
43 off += s
44
44
45 e = list(index[0])
45 e = list(index[0])
46 type = gettype(e[0])
46 type = gettype(e[0])
47 e[0] = offset_type(0, type)
47 e[0] = offset_type(0, type)
48 index[0] = tuple(e)
48 index[0] = tuple(e)
49
49
50 # add the magic null revision at -1
50 # add the magic null revision at -1
51 index.append((0, 0, 0, -1, -1, -1, -1, nullid))
51 index.append((0, 0, 0, -1, -1, -1, -1, nullid))
52
52
53 return index, cache
53 return index, cache
54
54
55 data_inlined = '\x00\x01\x00\x01\x00\x00\x00\x00\x00\x00\x01\x8c' \
55 data_inlined = '\x00\x01\x00\x01\x00\x00\x00\x00\x00\x00\x01\x8c' \
56 '\x00\x00\x04\x07\x00\x00\x00\x00\x00\x00\x15\x15\xff\xff\xff' \
56 '\x00\x00\x04\x07\x00\x00\x00\x00\x00\x00\x15\x15\xff\xff\xff' \
57 '\xff\xff\xff\xff\xff\xebG\x97\xb7\x1fB\x04\xcf\x13V\x81\tw\x1b' \
57 '\xff\xff\xff\xff\xff\xebG\x97\xb7\x1fB\x04\xcf\x13V\x81\tw\x1b' \
58 'w\xdduR\xda\xc6\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00' \
58 'w\xdduR\xda\xc6\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00' \
59 'x\x9c\x9d\x93?O\xc30\x10\xc5\xf7|\x8a\xdb\x9a\xa8m\x06\xd8*\x95' \
59 'x\x9c\x9d\x93?O\xc30\x10\xc5\xf7|\x8a\xdb\x9a\xa8m\x06\xd8*\x95' \
60 '\x81B\xa1\xa2\xa2R\xcb\x86Pd\x9a\x0b5$vd_\x04\xfd\xf6\x9c\xff@' \
60 '\x81B\xa1\xa2\xa2R\xcb\x86Pd\x9a\x0b5$vd_\x04\xfd\xf6\x9c\xff@' \
61 '\x11!\x0b\xd9\xec\xf7\xbbw\xe7gG6\xad6\x04\xdaN\xc0\x92\xa0$)' \
61 '\x11!\x0b\xd9\xec\xf7\xbbw\xe7gG6\xad6\x04\xdaN\xc0\x92\xa0$)' \
62 '\xb1\x82\xa2\xd1%\x16\xa4\x8b7\xa9\xca\xd4-\xb2Y\x02\xfc\xc9' \
62 '\xb1\x82\xa2\xd1%\x16\xa4\x8b7\xa9\xca\xd4-\xb2Y\x02\xfc\xc9' \
63 '\xcaS\xf9\xaeX\xed\xb6\xd77Q\x02\x83\xd4\x19\xf5--Y\xea\xe1W' \
63 '\xcaS\xf9\xaeX\xed\xb6\xd77Q\x02\x83\xd4\x19\xf5--Y\xea\xe1W' \
64 '\xab\xed\x10\xceR\x0f_\xdf\xdf\r\xe1,\xf5\xf0\xcb\xf5 \xceR\x0f' \
64 '\xab\xed\x10\xceR\x0f_\xdf\xdf\r\xe1,\xf5\xf0\xcb\xf5 \xceR\x0f' \
65 '_\xdc\x0e\x0e\xc3R\x0f_\xae\x96\x9b!\x9e\xa5\x1e\xbf\xdb,\x06' \
65 '_\xdc\x0e\x0e\xc3R\x0f_\xae\x96\x9b!\x9e\xa5\x1e\xbf\xdb,\x06' \
66 '\xc7q\x9a/\x88\x82\xc3B\xea\xb5\xb4TJ\x93\xb6\x82\x0e\xe16\xe6' \
66 '\xc7q\x9a/\x88\x82\xc3B\xea\xb5\xb4TJ\x93\xb6\x82\x0e\xe16\xe6' \
67 'KQ\xdb\xaf\xecG\xa3\xd1 \x01\xd3\x0b_^\xe8\xaa\xa0\xae\xad\xd1' \
67 'KQ\xdb\xaf\xecG\xa3\xd1 \x01\xd3\x0b_^\xe8\xaa\xa0\xae\xad\xd1' \
68 '&\xbef\x1bz\x08\xb0|\xc9Xz\x06\xf6Z\x91\x90J\xaa\x17\x90\xaa' \
68 '&\xbef\x1bz\x08\xb0|\xc9Xz\x06\xf6Z\x91\x90J\xaa\x17\x90\xaa' \
69 '\xd2\xa6\x11$5C\xcf\xba#\xa0\x03\x02*2\x92-\xfc\xb1\x94\xdf\xe2' \
69 '\xd2\xa6\x11$5C\xcf\xba#\xa0\x03\x02*2\x92-\xfc\xb1\x94\xdf\xe2' \
70 '\xae\xb8\'m\x8ey0^\x85\xd3\x82\xb4\xf0`:\x9c\x00\x8a\xfd\x01' \
70 '\xae\xb8\'m\x8ey0^\x85\xd3\x82\xb4\xf0`:\x9c\x00\x8a\xfd\x01' \
71 '\xb0\xc6\x86\x8b\xdd\xae\x80\xf3\xa9\x9fd\x16\n\x00R%\x1a\x06' \
71 '\xb0\xc6\x86\x8b\xdd\xae\x80\xf3\xa9\x9fd\x16\n\x00R%\x1a\x06' \
72 '\xe9\xd8b\x98\x1d\xf4\xf3+\x9bf\x01\xd8p\x1b\xf3.\xed\x9f^g\xc3' \
72 '\xe9\xd8b\x98\x1d\xf4\xf3+\x9bf\x01\xd8p\x1b\xf3.\xed\x9f^g\xc3' \
73 '^\xd9W81T\xdb\xd5\x04sx|\xf2\xeb\xd6`%?x\xed"\x831\xbf\xf3\xdc' \
73 '^\xd9W81T\xdb\xd5\x04sx|\xf2\xeb\xd6`%?x\xed"\x831\xbf\xf3\xdc' \
74 'b\xeb%gaY\xe1\xad\x9f\xb9f\'1w\xa9\xa5a\x83s\x82J\xb98\xbc4\x8b' \
74 'b\xeb%gaY\xe1\xad\x9f\xb9f\'1w\xa9\xa5a\x83s\x82J\xb98\xbc4\x8b' \
75 '\x83\x00\x9f$z\xb8#\xa5\xb1\xdf\x98\xd9\xec\x1b\x89O\xe3Ts\x9a4' \
75 '\x83\x00\x9f$z\xb8#\xa5\xb1\xdf\x98\xd9\xec\x1b\x89O\xe3Ts\x9a4' \
76 '\x17m\x8b\xfc\x8f\xa5\x95\x9a\xfc\xfa\xed,\xe5|\xa1\xfe\x15\xb9' \
76 '\x17m\x8b\xfc\x8f\xa5\x95\x9a\xfc\xfa\xed,\xe5|\xa1\xfe\x15\xb9' \
77 '\xbc\xb2\x93\x1f\xf2\x95\xff\xdf,\x1a\xc5\xe7\x17*\x93Oz:>\x0e'
77 '\xbc\xb2\x93\x1f\xf2\x95\xff\xdf,\x1a\xc5\xe7\x17*\x93Oz:>\x0e'
78
78
79 data_non_inlined = '\x00\x00\x00\x01\x00\x00\x00\x00\x00\x01D\x19' \
79 data_non_inlined = '\x00\x00\x00\x01\x00\x00\x00\x00\x00\x01D\x19' \
80 '\x00\x07e\x12\x00\x00\x00\x00\x00\x00\x00\x00\xff\xff\xff\xff' \
80 '\x00\x07e\x12\x00\x00\x00\x00\x00\x00\x00\x00\xff\xff\xff\xff' \
81 '\xff\xff\xff\xff\xd1\xf4\xbb\xb0\xbe\xfc\x13\xbd\x8c\xd3\x9d' \
81 '\xff\xff\xff\xff\xd1\xf4\xbb\xb0\xbe\xfc\x13\xbd\x8c\xd3\x9d' \
82 '\x0f\xcd\xd9;\x8c\x07\x8cJ/\x00\x00\x00\x00\x00\x00\x00\x00\x00' \
82 '\x0f\xcd\xd9;\x8c\x07\x8cJ/\x00\x00\x00\x00\x00\x00\x00\x00\x00' \
83 '\x00\x00\x00\x00\x00\x00\x01D\x19\x00\x00\x00\x00\x00\xdf\x00' \
83 '\x00\x00\x00\x00\x00\x00\x01D\x19\x00\x00\x00\x00\x00\xdf\x00' \
84 '\x00\x01q\x00\x00\x00\x01\x00\x00\x00\x01\x00\x00\x00\x00\xff' \
84 '\x00\x01q\x00\x00\x00\x01\x00\x00\x00\x01\x00\x00\x00\x00\xff' \
85 '\xff\xff\xff\xc1\x12\xb9\x04\x96\xa4Z1t\x91\xdfsJ\x90\xf0\x9bh' \
85 '\xff\xff\xff\xc1\x12\xb9\x04\x96\xa4Z1t\x91\xdfsJ\x90\xf0\x9bh' \
86 '\x07l&\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00' \
86 '\x07l&\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00' \
87 '\x00\x01D\xf8\x00\x00\x00\x00\x01\x1b\x00\x00\x01\xb8\x00\x00' \
87 '\x00\x01D\xf8\x00\x00\x00\x00\x01\x1b\x00\x00\x01\xb8\x00\x00' \
88 '\x00\x01\x00\x00\x00\x02\x00\x00\x00\x01\xff\xff\xff\xff\x02\n' \
88 '\x00\x01\x00\x00\x00\x02\x00\x00\x00\x01\xff\xff\xff\xff\x02\n' \
89 '\x0e\xc6&\xa1\x92\xae6\x0b\x02i\xfe-\xe5\xbao\x05\xd1\xe7\x00' \
89 '\x0e\xc6&\xa1\x92\xae6\x0b\x02i\xfe-\xe5\xbao\x05\xd1\xe7\x00' \
90 '\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x01F' \
90 '\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x01F' \
91 '\x13\x00\x00\x00\x00\x01\xec\x00\x00\x03\x06\x00\x00\x00\x01' \
91 '\x13\x00\x00\x00\x00\x01\xec\x00\x00\x03\x06\x00\x00\x00\x01' \
92 '\x00\x00\x00\x03\x00\x00\x00\x02\xff\xff\xff\xff\x12\xcb\xeby1' \
92 '\x00\x00\x00\x03\x00\x00\x00\x02\xff\xff\xff\xff\x12\xcb\xeby1' \
93 '\xb6\r\x98B\xcb\x07\xbd`\x8f\x92\xd9\xc4\x84\xbdK\x00\x00\x00' \
93 '\xb6\r\x98B\xcb\x07\xbd`\x8f\x92\xd9\xc4\x84\xbdK\x00\x00\x00' \
94 '\x00\x00\x00\x00\x00\x00\x00\x00\x00'
94 '\x00\x00\x00\x00\x00\x00\x00\x00\x00'
95
95
96 def parse_index2(data, inline):
96 def parse_index2(data, inline):
97 index, chunkcache = parsers.parse_index2(data, inline)
97 index, chunkcache = parsers.parse_index2(data, inline)
98 return list(index), chunkcache
98 return list(index), chunkcache
99
99
100 def runtest() :
100 def runtest() :
101 # Check that parse_index2() raises TypeError on bad arguments.
102 try:
103 parse_index2(0, True)
104 except TypeError:
105 pass
106 else:
107 print "Expected to get TypeError."
108
101 py_res_1 = py_parseindex(data_inlined, True)
109 py_res_1 = py_parseindex(data_inlined, True)
102 c_res_1 = parse_index2(data_inlined, True)
110 c_res_1 = parse_index2(data_inlined, True)
103
111
104 py_res_2 = py_parseindex(data_non_inlined, False)
112 py_res_2 = py_parseindex(data_non_inlined, False)
105 c_res_2 = parse_index2(data_non_inlined, False)
113 c_res_2 = parse_index2(data_non_inlined, False)
106
114
107 if py_res_1 != c_res_1:
115 if py_res_1 != c_res_1:
108 print "Parse index result (with inlined data) differs!"
116 print "Parse index result (with inlined data) differs!"
109
117
110 if py_res_2 != c_res_2:
118 if py_res_2 != c_res_2:
111 print "Parse index result (no inlined data) differs!"
119 print "Parse index result (no inlined data) differs!"
112
120
113 ix = parsers.parse_index2(data_inlined, True)[0]
121 ix = parsers.parse_index2(data_inlined, True)[0]
114 for i, r in enumerate(ix):
122 for i, r in enumerate(ix):
115 if r[7] == nullid:
123 if r[7] == nullid:
116 i = -1
124 i = -1
117 try:
125 try:
118 if ix[r[7]] != i:
126 if ix[r[7]] != i:
119 print 'Reverse lookup inconsistent for %r' % r[7].encode('hex')
127 print 'Reverse lookup inconsistent for %r' % r[7].encode('hex')
120 except TypeError:
128 except TypeError:
121 # pure version doesn't support this
129 # pure version doesn't support this
122 break
130 break
123
131
124 print "done"
132 print "done"
125
133
126 runtest()
134 runtest()
General Comments 0
You need to be logged in to leave comments. Login now