##// END OF EJS Templates
cext: move braces for control statements to same line...
Gregory Szorc -
r34438:ce26a138 default
parent child Browse files
Show More
@@ -1,189 +1,185 b''
1 /*
1 /*
2 base85 codec
2 base85 codec
3
3
4 Copyright 2006 Brendan Cully <brendan@kublai.com>
4 Copyright 2006 Brendan Cully <brendan@kublai.com>
5
5
6 This software may be used and distributed according to the terms of
6 This software may be used and distributed according to the terms of
7 the GNU General Public License, incorporated herein by reference.
7 the GNU General Public License, incorporated herein by reference.
8
8
9 Largely based on git's implementation
9 Largely based on git's implementation
10 */
10 */
11
11
12 #define PY_SSIZE_T_CLEAN
12 #define PY_SSIZE_T_CLEAN
13 #include <Python.h>
13 #include <Python.h>
14
14
15 #include "util.h"
15 #include "util.h"
16
16
/* The 85 digit characters of the encoding, ordered by digit value. */
static const char b85chars[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz!#$%&()*+-;<=>?@^_`{|}~";

/* Reverse lookup: byte value -> (digit value + 1); 0 marks "not a digit". */
static char b85dec[256];

/*
 * Fill in the b85dec reverse-lookup table from b85chars.
 *
 * Must run before the table is consulted; the module init functions
 * call it once at import time.
 */
static void b85prep(void)
{
	unsigned i;

	memset(b85dec, 0, sizeof(b85dec));
	/* sizeof(b85chars) counts the string's terminating NUL. Stop one
	 * short so that byte 0 is not registered as a (bogus) 86th digit. */
	for (i = 0; i < sizeof(b85chars) - 1; i++) {
		b85dec[(unsigned char)b85chars[i]] = (char)(i + 1);
	}
}
29
29
30 static PyObject *b85encode(PyObject *self, PyObject *args)
30 static PyObject *b85encode(PyObject *self, PyObject *args)
31 {
31 {
32 const unsigned char *text;
32 const unsigned char *text;
33 PyObject *out;
33 PyObject *out;
34 char *dst;
34 char *dst;
35 Py_ssize_t len, olen, i;
35 Py_ssize_t len, olen, i;
36 unsigned int acc, val, ch;
36 unsigned int acc, val, ch;
37 int pad = 0;
37 int pad = 0;
38
38
39 if (!PyArg_ParseTuple(args, "s#|i", &text, &len, &pad))
39 if (!PyArg_ParseTuple(args, "s#|i", &text, &len, &pad))
40 return NULL;
40 return NULL;
41
41
42 if (pad)
42 if (pad)
43 olen = ((len + 3) / 4 * 5) - 3;
43 olen = ((len + 3) / 4 * 5) - 3;
44 else {
44 else {
45 olen = len % 4;
45 olen = len % 4;
46 if (olen)
46 if (olen)
47 olen++;
47 olen++;
48 olen += len / 4 * 5;
48 olen += len / 4 * 5;
49 }
49 }
50 if (!(out = PyBytes_FromStringAndSize(NULL, olen + 3)))
50 if (!(out = PyBytes_FromStringAndSize(NULL, olen + 3)))
51 return NULL;
51 return NULL;
52
52
53 dst = PyBytes_AsString(out);
53 dst = PyBytes_AsString(out);
54
54
55 while (len) {
55 while (len) {
56 acc = 0;
56 acc = 0;
57 for (i = 24; i >= 0; i -= 8) {
57 for (i = 24; i >= 0; i -= 8) {
58 ch = *text++;
58 ch = *text++;
59 acc |= ch << i;
59 acc |= ch << i;
60 if (--len == 0)
60 if (--len == 0)
61 break;
61 break;
62 }
62 }
63 for (i = 4; i >= 0; i--) {
63 for (i = 4; i >= 0; i--) {
64 val = acc % 85;
64 val = acc % 85;
65 acc /= 85;
65 acc /= 85;
66 dst[i] = b85chars[val];
66 dst[i] = b85chars[val];
67 }
67 }
68 dst += 5;
68 dst += 5;
69 }
69 }
70
70
71 if (!pad)
71 if (!pad)
72 _PyBytes_Resize(&out, olen);
72 _PyBytes_Resize(&out, olen);
73
73
74 return out;
74 return out;
75 }
75 }
76
76
77 static PyObject *b85decode(PyObject *self, PyObject *args)
77 static PyObject *b85decode(PyObject *self, PyObject *args)
78 {
78 {
79 PyObject *out;
79 PyObject *out;
80 const char *text;
80 const char *text;
81 char *dst;
81 char *dst;
82 Py_ssize_t len, i, j, olen, cap;
82 Py_ssize_t len, i, j, olen, cap;
83 int c;
83 int c;
84 unsigned int acc;
84 unsigned int acc;
85
85
86 if (!PyArg_ParseTuple(args, "s#", &text, &len))
86 if (!PyArg_ParseTuple(args, "s#", &text, &len))
87 return NULL;
87 return NULL;
88
88
89 olen = len / 5 * 4;
89 olen = len / 5 * 4;
90 i = len % 5;
90 i = len % 5;
91 if (i)
91 if (i)
92 olen += i - 1;
92 olen += i - 1;
93 if (!(out = PyBytes_FromStringAndSize(NULL, olen)))
93 if (!(out = PyBytes_FromStringAndSize(NULL, olen)))
94 return NULL;
94 return NULL;
95
95
96 dst = PyBytes_AsString(out);
96 dst = PyBytes_AsString(out);
97
97
98 i = 0;
98 i = 0;
99 while (i < len)
99 while (i < len) {
100 {
101 acc = 0;
100 acc = 0;
102 cap = len - i - 1;
101 cap = len - i - 1;
103 if (cap > 4)
102 if (cap > 4)
104 cap = 4;
103 cap = 4;
105 for (j = 0; j < cap; i++, j++)
104 for (j = 0; j < cap; i++, j++) {
106 {
107 c = b85dec[(int)*text++] - 1;
105 c = b85dec[(int)*text++] - 1;
108 if (c < 0)
106 if (c < 0)
109 return PyErr_Format(
107 return PyErr_Format(
110 PyExc_ValueError,
108 PyExc_ValueError,
111 "bad base85 character at position %d",
109 "bad base85 character at position %d",
112 (int)i);
110 (int)i);
113 acc = acc * 85 + c;
111 acc = acc * 85 + c;
114 }
112 }
115 if (i++ < len)
113 if (i++ < len) {
116 {
117 c = b85dec[(int)*text++] - 1;
114 c = b85dec[(int)*text++] - 1;
118 if (c < 0)
115 if (c < 0)
119 return PyErr_Format(
116 return PyErr_Format(
120 PyExc_ValueError,
117 PyExc_ValueError,
121 "bad base85 character at position %d",
118 "bad base85 character at position %d",
122 (int)i);
119 (int)i);
123 /* overflow detection: 0xffffffff == "|NsC0",
120 /* overflow detection: 0xffffffff == "|NsC0",
124 * "|NsC" == 0x03030303 */
121 * "|NsC" == 0x03030303 */
125 if (acc > 0x03030303 || (acc *= 85) > 0xffffffff - c)
122 if (acc > 0x03030303 || (acc *= 85) > 0xffffffff - c)
126 return PyErr_Format(
123 return PyErr_Format(
127 PyExc_ValueError,
124 PyExc_ValueError,
128 "bad base85 sequence at position %d",
125 "bad base85 sequence at position %d",
129 (int)i);
126 (int)i);
130 acc += c;
127 acc += c;
131 }
128 }
132
129
133 cap = olen < 4 ? olen : 4;
130 cap = olen < 4 ? olen : 4;
134 olen -= cap;
131 olen -= cap;
135 for (j = 0; j < 4 - cap; j++)
132 for (j = 0; j < 4 - cap; j++)
136 acc *= 85;
133 acc *= 85;
137 if (cap && cap < 4)
134 if (cap && cap < 4)
138 acc += 0xffffff >> (cap - 1) * 8;
135 acc += 0xffffff >> (cap - 1) * 8;
139 for (j = 0; j < cap; j++)
136 for (j = 0; j < cap; j++) {
140 {
141 acc = (acc << 8) | (acc >> 24);
137 acc = (acc << 8) | (acc >> 24);
142 *dst++ = acc;
138 *dst++ = acc;
143 }
139 }
144 }
140 }
145
141
146 return out;
142 return out;
147 }
143 }
148
144
149 static char base85_doc[] = "Base85 Data Encoding";
145 static char base85_doc[] = "Base85 Data Encoding";
150
146
151 static PyMethodDef methods[] = {
147 static PyMethodDef methods[] = {
152 {"b85encode", b85encode, METH_VARARGS,
148 {"b85encode", b85encode, METH_VARARGS,
153 "Encode text in base85.\n\n"
149 "Encode text in base85.\n\n"
154 "If the second parameter is true, pad the result to a multiple of "
150 "If the second parameter is true, pad the result to a multiple of "
155 "five characters.\n"},
151 "five characters.\n"},
156 {"b85decode", b85decode, METH_VARARGS, "Decode base85 text.\n"},
152 {"b85decode", b85decode, METH_VARARGS, "Decode base85 text.\n"},
157 {NULL, NULL}
153 {NULL, NULL}
158 };
154 };
159
155
160 static const int version = 1;
156 static const int version = 1;
161
157
162 #ifdef IS_PY3K
158 #ifdef IS_PY3K
163 static struct PyModuleDef base85_module = {
159 static struct PyModuleDef base85_module = {
164 PyModuleDef_HEAD_INIT,
160 PyModuleDef_HEAD_INIT,
165 "base85",
161 "base85",
166 base85_doc,
162 base85_doc,
167 -1,
163 -1,
168 methods
164 methods
169 };
165 };
170
166
171 PyMODINIT_FUNC PyInit_base85(void)
167 PyMODINIT_FUNC PyInit_base85(void)
172 {
168 {
173 PyObject *m;
169 PyObject *m;
174 b85prep();
170 b85prep();
175
171
176 m = PyModule_Create(&base85_module);
172 m = PyModule_Create(&base85_module);
177 PyModule_AddIntConstant(m, "version", version);
173 PyModule_AddIntConstant(m, "version", version);
178 return m;
174 return m;
179 }
175 }
180 #else
176 #else
181 PyMODINIT_FUNC initbase85(void)
177 PyMODINIT_FUNC initbase85(void)
182 {
178 {
183 PyObject *m;
179 PyObject *m;
184 m = Py_InitModule3("base85", methods, base85_doc);
180 m = Py_InitModule3("base85", methods, base85_doc);
185
181
186 b85prep();
182 b85prep();
187 PyModule_AddIntConstant(m, "version", version);
183 PyModule_AddIntConstant(m, "version", version);
188 }
184 }
189 #endif
185 #endif
@@ -1,2090 +1,2089 b''
1 /*
1 /*
2 parsers.c - efficient content parsing
2 parsers.c - efficient content parsing
3
3
4 Copyright 2008 Matt Mackall <mpm@selenic.com> and others
4 Copyright 2008 Matt Mackall <mpm@selenic.com> and others
5
5
6 This software may be used and distributed according to the terms of
6 This software may be used and distributed according to the terms of
7 the GNU General Public License, incorporated herein by reference.
7 the GNU General Public License, incorporated herein by reference.
8 */
8 */
9
9
10 #include <Python.h>
10 #include <Python.h>
11 #include <assert.h>
11 #include <assert.h>
12 #include <ctype.h>
12 #include <ctype.h>
13 #include <stddef.h>
13 #include <stddef.h>
14 #include <string.h>
14 #include <string.h>
15
15
16 #include "charencode.h"
16 #include "charencode.h"
17 #include "util.h"
17 #include "util.h"
18 #include "bitmanipulation.h"
18 #include "bitmanipulation.h"
19
19
#ifdef IS_PY3K
/*
 * Temporary shim so this file compiles under Python 3: the PyInt_*
 * names used below are redirected to their PyLong_* counterparts.
 * To be dropped once the extension uses the proper types directly.
 */
#define PyInt_Check        PyLong_Check
#define PyInt_FromLong     PyLong_FromLong
#define PyInt_FromSsize_t  PyLong_FromSsize_t
#define PyInt_AS_LONG      PyLong_AS_LONG
#define PyInt_AsLong       PyLong_AsLong
#endif
30
30
/*
 * One node of the base-16 trie used for fast node->rev lookup.
 *
 * Each of the 16 slots holds:
 *   > 0  index of the next trie node
 *   < 0  a leaf, encoded as -(rev + 1)
 *   = 0  empty
 */
typedef struct {
	int children[16];
} nodetree;
41
41
42 /*
42 /*
43 * This class has two behaviors.
43 * This class has two behaviors.
44 *
44 *
45 * When used in a list-like way (with integer keys), we decode an
45 * When used in a list-like way (with integer keys), we decode an
46 * entry in a RevlogNG index file on demand. Our last entry is a
46 * entry in a RevlogNG index file on demand. Our last entry is a
47 * sentinel, always a nullid. We have limited support for
47 * sentinel, always a nullid. We have limited support for
48 * integer-keyed insert and delete, only at elements right before the
48 * integer-keyed insert and delete, only at elements right before the
49 * sentinel.
49 * sentinel.
50 *
50 *
51 * With string keys, we lazily perform a reverse mapping from node to
51 * With string keys, we lazily perform a reverse mapping from node to
52 * rev, using a base-16 trie.
52 * rev, using a base-16 trie.
53 */
53 */
54 typedef struct {
54 typedef struct {
55 PyObject_HEAD
55 PyObject_HEAD
56 /* Type-specific fields go here. */
56 /* Type-specific fields go here. */
57 PyObject *data; /* raw bytes of index */
57 PyObject *data; /* raw bytes of index */
58 Py_buffer buf; /* buffer of data */
58 Py_buffer buf; /* buffer of data */
59 PyObject **cache; /* cached tuples */
59 PyObject **cache; /* cached tuples */
60 const char **offsets; /* populated on demand */
60 const char **offsets; /* populated on demand */
61 Py_ssize_t raw_length; /* original number of elements */
61 Py_ssize_t raw_length; /* original number of elements */
62 Py_ssize_t length; /* current number of elements */
62 Py_ssize_t length; /* current number of elements */
63 PyObject *added; /* populated on demand */
63 PyObject *added; /* populated on demand */
64 PyObject *headrevs; /* cache, invalidated on changes */
64 PyObject *headrevs; /* cache, invalidated on changes */
65 PyObject *filteredrevs;/* filtered revs set */
65 PyObject *filteredrevs;/* filtered revs set */
66 nodetree *nt; /* base-16 trie */
66 nodetree *nt; /* base-16 trie */
67 unsigned ntlength; /* # nodes in use */
67 unsigned ntlength; /* # nodes in use */
68 unsigned ntcapacity; /* # nodes allocated */
68 unsigned ntcapacity; /* # nodes allocated */
69 int ntdepth; /* maximum depth of tree */
69 int ntdepth; /* maximum depth of tree */
70 int ntsplits; /* # splits performed */
70 int ntsplits; /* # splits performed */
71 int ntrev; /* last rev scanned */
71 int ntrev; /* last rev scanned */
72 int ntlookups; /* # lookups */
72 int ntlookups; /* # lookups */
73 int ntmisses; /* # lookups that miss the cache */
73 int ntmisses; /* # lookups that miss the cache */
74 int inlined;
74 int inlined;
75 } indexObject;
75 } indexObject;
76
76
77 static Py_ssize_t index_length(const indexObject *self)
77 static Py_ssize_t index_length(const indexObject *self)
78 {
78 {
79 if (self->added == NULL)
79 if (self->added == NULL)
80 return self->length;
80 return self->length;
81 return self->length + PyList_GET_SIZE(self->added);
81 return self->length + PyList_GET_SIZE(self->added);
82 }
82 }
83
83
84 static PyObject *nullentry;
84 static PyObject *nullentry;
85 static const char nullid[20];
85 static const char nullid[20];
86
86
87 static Py_ssize_t inline_scan(indexObject *self, const char **offsets);
87 static Py_ssize_t inline_scan(indexObject *self, const char **offsets);
88
88
89 #if LONG_MAX == 0x7fffffffL
89 #if LONG_MAX == 0x7fffffffL
90 static char *tuple_format = "Kiiiiiis#";
90 static char *tuple_format = "Kiiiiiis#";
91 #else
91 #else
92 static char *tuple_format = "kiiiiiis#";
92 static char *tuple_format = "kiiiiiis#";
93 #endif
93 #endif
94
94
95 /* A RevlogNG v1 index entry is 64 bytes long. */
95 /* A RevlogNG v1 index entry is 64 bytes long. */
96 static const long v1_hdrsize = 64;
96 static const long v1_hdrsize = 64;
97
97
98 /*
98 /*
99 * Return a pointer to the beginning of a RevlogNG record.
99 * Return a pointer to the beginning of a RevlogNG record.
100 */
100 */
101 static const char *index_deref(indexObject *self, Py_ssize_t pos)
101 static const char *index_deref(indexObject *self, Py_ssize_t pos)
102 {
102 {
103 if (self->inlined && pos > 0) {
103 if (self->inlined && pos > 0) {
104 if (self->offsets == NULL) {
104 if (self->offsets == NULL) {
105 self->offsets = PyMem_Malloc(self->raw_length *
105 self->offsets = PyMem_Malloc(self->raw_length *
106 sizeof(*self->offsets));
106 sizeof(*self->offsets));
107 if (self->offsets == NULL)
107 if (self->offsets == NULL)
108 return (const char *)PyErr_NoMemory();
108 return (const char *)PyErr_NoMemory();
109 inline_scan(self, self->offsets);
109 inline_scan(self, self->offsets);
110 }
110 }
111 return self->offsets[pos];
111 return self->offsets[pos];
112 }
112 }
113
113
114 return (const char *)(self->buf.buf) + pos * v1_hdrsize;
114 return (const char *)(self->buf.buf) + pos * v1_hdrsize;
115 }
115 }
116
116
117 static inline int index_get_parents(indexObject *self, Py_ssize_t rev,
117 static inline int index_get_parents(indexObject *self, Py_ssize_t rev,
118 int *ps, int maxrev)
118 int *ps, int maxrev)
119 {
119 {
120 if (rev >= self->length - 1) {
120 if (rev >= self->length - 1) {
121 PyObject *tuple = PyList_GET_ITEM(self->added,
121 PyObject *tuple = PyList_GET_ITEM(self->added,
122 rev - self->length + 1);
122 rev - self->length + 1);
123 ps[0] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 5));
123 ps[0] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 5));
124 ps[1] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 6));
124 ps[1] = (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 6));
125 } else {
125 } else {
126 const char *data = index_deref(self, rev);
126 const char *data = index_deref(self, rev);
127 ps[0] = getbe32(data + 24);
127 ps[0] = getbe32(data + 24);
128 ps[1] = getbe32(data + 28);
128 ps[1] = getbe32(data + 28);
129 }
129 }
130 /* If index file is corrupted, ps[] may point to invalid revisions. So
130 /* If index file is corrupted, ps[] may point to invalid revisions. So
131 * there is a risk of buffer overflow to trust them unconditionally. */
131 * there is a risk of buffer overflow to trust them unconditionally. */
132 if (ps[0] > maxrev || ps[1] > maxrev) {
132 if (ps[0] > maxrev || ps[1] > maxrev) {
133 PyErr_SetString(PyExc_ValueError, "parent out of range");
133 PyErr_SetString(PyExc_ValueError, "parent out of range");
134 return -1;
134 return -1;
135 }
135 }
136 return 0;
136 return 0;
137 }
137 }
138
138
139
139
140 /*
140 /*
141 * RevlogNG format (all in big endian, data may be inlined):
141 * RevlogNG format (all in big endian, data may be inlined):
142 * 6 bytes: offset
142 * 6 bytes: offset
143 * 2 bytes: flags
143 * 2 bytes: flags
144 * 4 bytes: compressed length
144 * 4 bytes: compressed length
145 * 4 bytes: uncompressed length
145 * 4 bytes: uncompressed length
146 * 4 bytes: base revision
146 * 4 bytes: base revision
147 * 4 bytes: link revision
147 * 4 bytes: link revision
148 * 4 bytes: parent 1 revision
148 * 4 bytes: parent 1 revision
149 * 4 bytes: parent 2 revision
149 * 4 bytes: parent 2 revision
150 * 32 bytes: nodeid (only 20 bytes used)
150 * 32 bytes: nodeid (only 20 bytes used)
151 */
151 */
152 static PyObject *index_get(indexObject *self, Py_ssize_t pos)
152 static PyObject *index_get(indexObject *self, Py_ssize_t pos)
153 {
153 {
154 uint64_t offset_flags;
154 uint64_t offset_flags;
155 int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
155 int comp_len, uncomp_len, base_rev, link_rev, parent_1, parent_2;
156 const char *c_node_id;
156 const char *c_node_id;
157 const char *data;
157 const char *data;
158 Py_ssize_t length = index_length(self);
158 Py_ssize_t length = index_length(self);
159 PyObject *entry;
159 PyObject *entry;
160
160
161 if (pos < 0)
161 if (pos < 0)
162 pos += length;
162 pos += length;
163
163
164 if (pos < 0 || pos >= length) {
164 if (pos < 0 || pos >= length) {
165 PyErr_SetString(PyExc_IndexError, "revlog index out of range");
165 PyErr_SetString(PyExc_IndexError, "revlog index out of range");
166 return NULL;
166 return NULL;
167 }
167 }
168
168
169 if (pos == length - 1) {
169 if (pos == length - 1) {
170 Py_INCREF(nullentry);
170 Py_INCREF(nullentry);
171 return nullentry;
171 return nullentry;
172 }
172 }
173
173
174 if (pos >= self->length - 1) {
174 if (pos >= self->length - 1) {
175 PyObject *obj;
175 PyObject *obj;
176 obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
176 obj = PyList_GET_ITEM(self->added, pos - self->length + 1);
177 Py_INCREF(obj);
177 Py_INCREF(obj);
178 return obj;
178 return obj;
179 }
179 }
180
180
181 if (self->cache) {
181 if (self->cache) {
182 if (self->cache[pos]) {
182 if (self->cache[pos]) {
183 Py_INCREF(self->cache[pos]);
183 Py_INCREF(self->cache[pos]);
184 return self->cache[pos];
184 return self->cache[pos];
185 }
185 }
186 } else {
186 } else {
187 self->cache = calloc(self->raw_length, sizeof(PyObject *));
187 self->cache = calloc(self->raw_length, sizeof(PyObject *));
188 if (self->cache == NULL)
188 if (self->cache == NULL)
189 return PyErr_NoMemory();
189 return PyErr_NoMemory();
190 }
190 }
191
191
192 data = index_deref(self, pos);
192 data = index_deref(self, pos);
193 if (data == NULL)
193 if (data == NULL)
194 return NULL;
194 return NULL;
195
195
196 offset_flags = getbe32(data + 4);
196 offset_flags = getbe32(data + 4);
197 if (pos == 0) /* mask out version number for the first entry */
197 if (pos == 0) /* mask out version number for the first entry */
198 offset_flags &= 0xFFFF;
198 offset_flags &= 0xFFFF;
199 else {
199 else {
200 uint32_t offset_high = getbe32(data);
200 uint32_t offset_high = getbe32(data);
201 offset_flags |= ((uint64_t)offset_high) << 32;
201 offset_flags |= ((uint64_t)offset_high) << 32;
202 }
202 }
203
203
204 comp_len = getbe32(data + 8);
204 comp_len = getbe32(data + 8);
205 uncomp_len = getbe32(data + 12);
205 uncomp_len = getbe32(data + 12);
206 base_rev = getbe32(data + 16);
206 base_rev = getbe32(data + 16);
207 link_rev = getbe32(data + 20);
207 link_rev = getbe32(data + 20);
208 parent_1 = getbe32(data + 24);
208 parent_1 = getbe32(data + 24);
209 parent_2 = getbe32(data + 28);
209 parent_2 = getbe32(data + 28);
210 c_node_id = data + 32;
210 c_node_id = data + 32;
211
211
212 entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
212 entry = Py_BuildValue(tuple_format, offset_flags, comp_len,
213 uncomp_len, base_rev, link_rev,
213 uncomp_len, base_rev, link_rev,
214 parent_1, parent_2, c_node_id, 20);
214 parent_1, parent_2, c_node_id, 20);
215
215
216 if (entry) {
216 if (entry) {
217 PyObject_GC_UnTrack(entry);
217 PyObject_GC_UnTrack(entry);
218 Py_INCREF(entry);
218 Py_INCREF(entry);
219 }
219 }
220
220
221 self->cache[pos] = entry;
221 self->cache[pos] = entry;
222
222
223 return entry;
223 return entry;
224 }
224 }
225
225
226 /*
226 /*
227 * Return the 20-byte SHA of the node corresponding to the given rev.
227 * Return the 20-byte SHA of the node corresponding to the given rev.
228 */
228 */
229 static const char *index_node(indexObject *self, Py_ssize_t pos)
229 static const char *index_node(indexObject *self, Py_ssize_t pos)
230 {
230 {
231 Py_ssize_t length = index_length(self);
231 Py_ssize_t length = index_length(self);
232 const char *data;
232 const char *data;
233
233
234 if (pos == length - 1 || pos == INT_MAX)
234 if (pos == length - 1 || pos == INT_MAX)
235 return nullid;
235 return nullid;
236
236
237 if (pos >= length)
237 if (pos >= length)
238 return NULL;
238 return NULL;
239
239
240 if (pos >= self->length - 1) {
240 if (pos >= self->length - 1) {
241 PyObject *tuple, *str;
241 PyObject *tuple, *str;
242 tuple = PyList_GET_ITEM(self->added, pos - self->length + 1);
242 tuple = PyList_GET_ITEM(self->added, pos - self->length + 1);
243 str = PyTuple_GetItem(tuple, 7);
243 str = PyTuple_GetItem(tuple, 7);
244 return str ? PyBytes_AS_STRING(str) : NULL;
244 return str ? PyBytes_AS_STRING(str) : NULL;
245 }
245 }
246
246
247 data = index_deref(self, pos);
247 data = index_deref(self, pos);
248 return data ? data + 32 : NULL;
248 return data ? data + 32 : NULL;
249 }
249 }
250
250
251 static int nt_insert(indexObject *self, const char *node, int rev);
251 static int nt_insert(indexObject *self, const char *node, int rev);
252
252
253 static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
253 static int node_check(PyObject *obj, char **node, Py_ssize_t *nodelen)
254 {
254 {
255 if (PyBytes_AsStringAndSize(obj, node, nodelen) == -1)
255 if (PyBytes_AsStringAndSize(obj, node, nodelen) == -1)
256 return -1;
256 return -1;
257 if (*nodelen == 20)
257 if (*nodelen == 20)
258 return 0;
258 return 0;
259 PyErr_SetString(PyExc_ValueError, "20-byte hash required");
259 PyErr_SetString(PyExc_ValueError, "20-byte hash required");
260 return -1;
260 return -1;
261 }
261 }
262
262
263 static PyObject *index_insert(indexObject *self, PyObject *args)
263 static PyObject *index_insert(indexObject *self, PyObject *args)
264 {
264 {
265 PyObject *obj;
265 PyObject *obj;
266 char *node;
266 char *node;
267 int index;
267 int index;
268 Py_ssize_t len, nodelen;
268 Py_ssize_t len, nodelen;
269
269
270 if (!PyArg_ParseTuple(args, "iO", &index, &obj))
270 if (!PyArg_ParseTuple(args, "iO", &index, &obj))
271 return NULL;
271 return NULL;
272
272
273 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 8) {
273 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 8) {
274 PyErr_SetString(PyExc_TypeError, "8-tuple required");
274 PyErr_SetString(PyExc_TypeError, "8-tuple required");
275 return NULL;
275 return NULL;
276 }
276 }
277
277
278 if (node_check(PyTuple_GET_ITEM(obj, 7), &node, &nodelen) == -1)
278 if (node_check(PyTuple_GET_ITEM(obj, 7), &node, &nodelen) == -1)
279 return NULL;
279 return NULL;
280
280
281 len = index_length(self);
281 len = index_length(self);
282
282
283 if (index < 0)
283 if (index < 0)
284 index += len;
284 index += len;
285
285
286 if (index != len - 1) {
286 if (index != len - 1) {
287 PyErr_SetString(PyExc_IndexError,
287 PyErr_SetString(PyExc_IndexError,
288 "insert only supported at index -1");
288 "insert only supported at index -1");
289 return NULL;
289 return NULL;
290 }
290 }
291
291
292 if (self->added == NULL) {
292 if (self->added == NULL) {
293 self->added = PyList_New(0);
293 self->added = PyList_New(0);
294 if (self->added == NULL)
294 if (self->added == NULL)
295 return NULL;
295 return NULL;
296 }
296 }
297
297
298 if (PyList_Append(self->added, obj) == -1)
298 if (PyList_Append(self->added, obj) == -1)
299 return NULL;
299 return NULL;
300
300
301 if (self->nt)
301 if (self->nt)
302 nt_insert(self, node, index);
302 nt_insert(self, node, index);
303
303
304 Py_CLEAR(self->headrevs);
304 Py_CLEAR(self->headrevs);
305 Py_RETURN_NONE;
305 Py_RETURN_NONE;
306 }
306 }
307
307
308 static void _index_clearcaches(indexObject *self)
308 static void _index_clearcaches(indexObject *self)
309 {
309 {
310 if (self->cache) {
310 if (self->cache) {
311 Py_ssize_t i;
311 Py_ssize_t i;
312
312
313 for (i = 0; i < self->raw_length; i++)
313 for (i = 0; i < self->raw_length; i++)
314 Py_CLEAR(self->cache[i]);
314 Py_CLEAR(self->cache[i]);
315 free(self->cache);
315 free(self->cache);
316 self->cache = NULL;
316 self->cache = NULL;
317 }
317 }
318 if (self->offsets) {
318 if (self->offsets) {
319 PyMem_Free(self->offsets);
319 PyMem_Free(self->offsets);
320 self->offsets = NULL;
320 self->offsets = NULL;
321 }
321 }
322 if (self->nt) {
322 if (self->nt) {
323 free(self->nt);
323 free(self->nt);
324 self->nt = NULL;
324 self->nt = NULL;
325 }
325 }
326 Py_CLEAR(self->headrevs);
326 Py_CLEAR(self->headrevs);
327 }
327 }
328
328
329 static PyObject *index_clearcaches(indexObject *self)
329 static PyObject *index_clearcaches(indexObject *self)
330 {
330 {
331 _index_clearcaches(self);
331 _index_clearcaches(self);
332 self->ntlength = self->ntcapacity = 0;
332 self->ntlength = self->ntcapacity = 0;
333 self->ntdepth = self->ntsplits = 0;
333 self->ntdepth = self->ntsplits = 0;
334 self->ntrev = -1;
334 self->ntrev = -1;
335 self->ntlookups = self->ntmisses = 0;
335 self->ntlookups = self->ntmisses = 0;
336 Py_RETURN_NONE;
336 Py_RETURN_NONE;
337 }
337 }
338
338
339 static PyObject *index_stats(indexObject *self)
339 static PyObject *index_stats(indexObject *self)
340 {
340 {
341 PyObject *obj = PyDict_New();
341 PyObject *obj = PyDict_New();
342 PyObject *t = NULL;
342 PyObject *t = NULL;
343
343
344 if (obj == NULL)
344 if (obj == NULL)
345 return NULL;
345 return NULL;
346
346
347 #define istat(__n, __d) \
347 #define istat(__n, __d) \
348 do { \
348 do { \
349 t = PyInt_FromSsize_t(self->__n); \
349 t = PyInt_FromSsize_t(self->__n); \
350 if (!t) \
350 if (!t) \
351 goto bail; \
351 goto bail; \
352 if (PyDict_SetItemString(obj, __d, t) == -1) \
352 if (PyDict_SetItemString(obj, __d, t) == -1) \
353 goto bail; \
353 goto bail; \
354 Py_DECREF(t); \
354 Py_DECREF(t); \
355 } while (0)
355 } while (0)
356
356
357 if (self->added) {
357 if (self->added) {
358 Py_ssize_t len = PyList_GET_SIZE(self->added);
358 Py_ssize_t len = PyList_GET_SIZE(self->added);
359 t = PyInt_FromSsize_t(len);
359 t = PyInt_FromSsize_t(len);
360 if (!t)
360 if (!t)
361 goto bail;
361 goto bail;
362 if (PyDict_SetItemString(obj, "index entries added", t) == -1)
362 if (PyDict_SetItemString(obj, "index entries added", t) == -1)
363 goto bail;
363 goto bail;
364 Py_DECREF(t);
364 Py_DECREF(t);
365 }
365 }
366
366
367 if (self->raw_length != self->length - 1)
367 if (self->raw_length != self->length - 1)
368 istat(raw_length, "revs on disk");
368 istat(raw_length, "revs on disk");
369 istat(length, "revs in memory");
369 istat(length, "revs in memory");
370 istat(ntcapacity, "node trie capacity");
370 istat(ntcapacity, "node trie capacity");
371 istat(ntdepth, "node trie depth");
371 istat(ntdepth, "node trie depth");
372 istat(ntlength, "node trie count");
372 istat(ntlength, "node trie count");
373 istat(ntlookups, "node trie lookups");
373 istat(ntlookups, "node trie lookups");
374 istat(ntmisses, "node trie misses");
374 istat(ntmisses, "node trie misses");
375 istat(ntrev, "node trie last rev scanned");
375 istat(ntrev, "node trie last rev scanned");
376 istat(ntsplits, "node trie splits");
376 istat(ntsplits, "node trie splits");
377
377
378 #undef istat
378 #undef istat
379
379
380 return obj;
380 return obj;
381
381
382 bail:
382 bail:
383 Py_XDECREF(obj);
383 Py_XDECREF(obj);
384 Py_XDECREF(t);
384 Py_XDECREF(t);
385 return NULL;
385 return NULL;
386 }
386 }
387
387
388 /*
388 /*
389 * When we cache a list, we want to be sure the caller can't mutate
389 * When we cache a list, we want to be sure the caller can't mutate
390 * the cached copy.
390 * the cached copy.
391 */
391 */
392 static PyObject *list_copy(PyObject *list)
392 static PyObject *list_copy(PyObject *list)
393 {
393 {
394 Py_ssize_t len = PyList_GET_SIZE(list);
394 Py_ssize_t len = PyList_GET_SIZE(list);
395 PyObject *newlist = PyList_New(len);
395 PyObject *newlist = PyList_New(len);
396 Py_ssize_t i;
396 Py_ssize_t i;
397
397
398 if (newlist == NULL)
398 if (newlist == NULL)
399 return NULL;
399 return NULL;
400
400
401 for (i = 0; i < len; i++) {
401 for (i = 0; i < len; i++) {
402 PyObject *obj = PyList_GET_ITEM(list, i);
402 PyObject *obj = PyList_GET_ITEM(list, i);
403 Py_INCREF(obj);
403 Py_INCREF(obj);
404 PyList_SET_ITEM(newlist, i, obj);
404 PyList_SET_ITEM(newlist, i, obj);
405 }
405 }
406
406
407 return newlist;
407 return newlist;
408 }
408 }
409
409
410 static int check_filter(PyObject *filter, Py_ssize_t arg) {
410 static int check_filter(PyObject *filter, Py_ssize_t arg) {
411 if (filter) {
411 if (filter) {
412 PyObject *arglist, *result;
412 PyObject *arglist, *result;
413 int isfiltered;
413 int isfiltered;
414
414
415 arglist = Py_BuildValue("(n)", arg);
415 arglist = Py_BuildValue("(n)", arg);
416 if (!arglist) {
416 if (!arglist) {
417 return -1;
417 return -1;
418 }
418 }
419
419
420 result = PyEval_CallObject(filter, arglist);
420 result = PyEval_CallObject(filter, arglist);
421 Py_DECREF(arglist);
421 Py_DECREF(arglist);
422 if (!result) {
422 if (!result) {
423 return -1;
423 return -1;
424 }
424 }
425
425
426 /* PyObject_IsTrue returns 1 if true, 0 if false, -1 if error,
426 /* PyObject_IsTrue returns 1 if true, 0 if false, -1 if error,
427 * same as this function, so we can just return it directly.*/
427 * same as this function, so we can just return it directly.*/
428 isfiltered = PyObject_IsTrue(result);
428 isfiltered = PyObject_IsTrue(result);
429 Py_DECREF(result);
429 Py_DECREF(result);
430 return isfiltered;
430 return isfiltered;
431 } else {
431 } else {
432 return 0;
432 return 0;
433 }
433 }
434 }
434 }
435
435
436 static Py_ssize_t add_roots_get_min(indexObject *self, PyObject *list,
436 static Py_ssize_t add_roots_get_min(indexObject *self, PyObject *list,
437 Py_ssize_t marker, char *phases)
437 Py_ssize_t marker, char *phases)
438 {
438 {
439 PyObject *iter = NULL;
439 PyObject *iter = NULL;
440 PyObject *iter_item = NULL;
440 PyObject *iter_item = NULL;
441 Py_ssize_t min_idx = index_length(self) + 1;
441 Py_ssize_t min_idx = index_length(self) + 1;
442 long iter_item_long;
442 long iter_item_long;
443
443
444 if (PyList_GET_SIZE(list) != 0) {
444 if (PyList_GET_SIZE(list) != 0) {
445 iter = PyObject_GetIter(list);
445 iter = PyObject_GetIter(list);
446 if (iter == NULL)
446 if (iter == NULL)
447 return -2;
447 return -2;
448 while ((iter_item = PyIter_Next(iter)))
448 while ((iter_item = PyIter_Next(iter))) {
449 {
450 iter_item_long = PyInt_AS_LONG(iter_item);
449 iter_item_long = PyInt_AS_LONG(iter_item);
451 Py_DECREF(iter_item);
450 Py_DECREF(iter_item);
452 if (iter_item_long < min_idx)
451 if (iter_item_long < min_idx)
453 min_idx = iter_item_long;
452 min_idx = iter_item_long;
454 phases[iter_item_long] = marker;
453 phases[iter_item_long] = marker;
455 }
454 }
456 Py_DECREF(iter);
455 Py_DECREF(iter);
457 }
456 }
458
457
459 return min_idx;
458 return min_idx;
460 }
459 }
461
460
462 static inline void set_phase_from_parents(char *phases, int parent_1,
461 static inline void set_phase_from_parents(char *phases, int parent_1,
463 int parent_2, Py_ssize_t i)
462 int parent_2, Py_ssize_t i)
464 {
463 {
465 if (parent_1 >= 0 && phases[parent_1] > phases[i])
464 if (parent_1 >= 0 && phases[parent_1] > phases[i])
466 phases[i] = phases[parent_1];
465 phases[i] = phases[parent_1];
467 if (parent_2 >= 0 && phases[parent_2] > phases[i])
466 if (parent_2 >= 0 && phases[parent_2] > phases[i])
468 phases[i] = phases[parent_2];
467 phases[i] = phases[parent_2];
469 }
468 }
470
469
471 static PyObject *reachableroots2(indexObject *self, PyObject *args)
470 static PyObject *reachableroots2(indexObject *self, PyObject *args)
472 {
471 {
473
472
474 /* Input */
473 /* Input */
475 long minroot;
474 long minroot;
476 PyObject *includepatharg = NULL;
475 PyObject *includepatharg = NULL;
477 int includepath = 0;
476 int includepath = 0;
478 /* heads and roots are lists */
477 /* heads and roots are lists */
479 PyObject *heads = NULL;
478 PyObject *heads = NULL;
480 PyObject *roots = NULL;
479 PyObject *roots = NULL;
481 PyObject *reachable = NULL;
480 PyObject *reachable = NULL;
482
481
483 PyObject *val;
482 PyObject *val;
484 Py_ssize_t len = index_length(self) - 1;
483 Py_ssize_t len = index_length(self) - 1;
485 long revnum;
484 long revnum;
486 Py_ssize_t k;
485 Py_ssize_t k;
487 Py_ssize_t i;
486 Py_ssize_t i;
488 Py_ssize_t l;
487 Py_ssize_t l;
489 int r;
488 int r;
490 int parents[2];
489 int parents[2];
491
490
492 /* Internal data structure:
491 /* Internal data structure:
493 * tovisit: array of length len+1 (all revs + nullrev), filled upto lentovisit
492 * tovisit: array of length len+1 (all revs + nullrev), filled upto lentovisit
494 * revstates: array of length len+1 (all revs + nullrev) */
493 * revstates: array of length len+1 (all revs + nullrev) */
495 int *tovisit = NULL;
494 int *tovisit = NULL;
496 long lentovisit = 0;
495 long lentovisit = 0;
497 enum { RS_SEEN = 1, RS_ROOT = 2, RS_REACHABLE = 4 };
496 enum { RS_SEEN = 1, RS_ROOT = 2, RS_REACHABLE = 4 };
498 char *revstates = NULL;
497 char *revstates = NULL;
499
498
500 /* Get arguments */
499 /* Get arguments */
501 if (!PyArg_ParseTuple(args, "lO!O!O!", &minroot, &PyList_Type, &heads,
500 if (!PyArg_ParseTuple(args, "lO!O!O!", &minroot, &PyList_Type, &heads,
502 &PyList_Type, &roots,
501 &PyList_Type, &roots,
503 &PyBool_Type, &includepatharg))
502 &PyBool_Type, &includepatharg))
504 goto bail;
503 goto bail;
505
504
506 if (includepatharg == Py_True)
505 if (includepatharg == Py_True)
507 includepath = 1;
506 includepath = 1;
508
507
509 /* Initialize return set */
508 /* Initialize return set */
510 reachable = PyList_New(0);
509 reachable = PyList_New(0);
511 if (reachable == NULL)
510 if (reachable == NULL)
512 goto bail;
511 goto bail;
513
512
514 /* Initialize internal datastructures */
513 /* Initialize internal datastructures */
515 tovisit = (int *)malloc((len + 1) * sizeof(int));
514 tovisit = (int *)malloc((len + 1) * sizeof(int));
516 if (tovisit == NULL) {
515 if (tovisit == NULL) {
517 PyErr_NoMemory();
516 PyErr_NoMemory();
518 goto bail;
517 goto bail;
519 }
518 }
520
519
521 revstates = (char *)calloc(len + 1, 1);
520 revstates = (char *)calloc(len + 1, 1);
522 if (revstates == NULL) {
521 if (revstates == NULL) {
523 PyErr_NoMemory();
522 PyErr_NoMemory();
524 goto bail;
523 goto bail;
525 }
524 }
526
525
527 l = PyList_GET_SIZE(roots);
526 l = PyList_GET_SIZE(roots);
528 for (i = 0; i < l; i++) {
527 for (i = 0; i < l; i++) {
529 revnum = PyInt_AsLong(PyList_GET_ITEM(roots, i));
528 revnum = PyInt_AsLong(PyList_GET_ITEM(roots, i));
530 if (revnum == -1 && PyErr_Occurred())
529 if (revnum == -1 && PyErr_Occurred())
531 goto bail;
530 goto bail;
532 /* If root is out of range, e.g. wdir(), it must be unreachable
531 /* If root is out of range, e.g. wdir(), it must be unreachable
533 * from heads. So we can just ignore it. */
532 * from heads. So we can just ignore it. */
534 if (revnum + 1 < 0 || revnum + 1 >= len + 1)
533 if (revnum + 1 < 0 || revnum + 1 >= len + 1)
535 continue;
534 continue;
536 revstates[revnum + 1] |= RS_ROOT;
535 revstates[revnum + 1] |= RS_ROOT;
537 }
536 }
538
537
539 /* Populate tovisit with all the heads */
538 /* Populate tovisit with all the heads */
540 l = PyList_GET_SIZE(heads);
539 l = PyList_GET_SIZE(heads);
541 for (i = 0; i < l; i++) {
540 for (i = 0; i < l; i++) {
542 revnum = PyInt_AsLong(PyList_GET_ITEM(heads, i));
541 revnum = PyInt_AsLong(PyList_GET_ITEM(heads, i));
543 if (revnum == -1 && PyErr_Occurred())
542 if (revnum == -1 && PyErr_Occurred())
544 goto bail;
543 goto bail;
545 if (revnum + 1 < 0 || revnum + 1 >= len + 1) {
544 if (revnum + 1 < 0 || revnum + 1 >= len + 1) {
546 PyErr_SetString(PyExc_IndexError, "head out of range");
545 PyErr_SetString(PyExc_IndexError, "head out of range");
547 goto bail;
546 goto bail;
548 }
547 }
549 if (!(revstates[revnum + 1] & RS_SEEN)) {
548 if (!(revstates[revnum + 1] & RS_SEEN)) {
550 tovisit[lentovisit++] = (int)revnum;
549 tovisit[lentovisit++] = (int)revnum;
551 revstates[revnum + 1] |= RS_SEEN;
550 revstates[revnum + 1] |= RS_SEEN;
552 }
551 }
553 }
552 }
554
553
555 /* Visit the tovisit list and find the reachable roots */
554 /* Visit the tovisit list and find the reachable roots */
556 k = 0;
555 k = 0;
557 while (k < lentovisit) {
556 while (k < lentovisit) {
558 /* Add the node to reachable if it is a root*/
557 /* Add the node to reachable if it is a root*/
559 revnum = tovisit[k++];
558 revnum = tovisit[k++];
560 if (revstates[revnum + 1] & RS_ROOT) {
559 if (revstates[revnum + 1] & RS_ROOT) {
561 revstates[revnum + 1] |= RS_REACHABLE;
560 revstates[revnum + 1] |= RS_REACHABLE;
562 val = PyInt_FromLong(revnum);
561 val = PyInt_FromLong(revnum);
563 if (val == NULL)
562 if (val == NULL)
564 goto bail;
563 goto bail;
565 r = PyList_Append(reachable, val);
564 r = PyList_Append(reachable, val);
566 Py_DECREF(val);
565 Py_DECREF(val);
567 if (r < 0)
566 if (r < 0)
568 goto bail;
567 goto bail;
569 if (includepath == 0)
568 if (includepath == 0)
570 continue;
569 continue;
571 }
570 }
572
571
573 /* Add its parents to the list of nodes to visit */
572 /* Add its parents to the list of nodes to visit */
574 if (revnum == -1)
573 if (revnum == -1)
575 continue;
574 continue;
576 r = index_get_parents(self, revnum, parents, (int)len - 1);
575 r = index_get_parents(self, revnum, parents, (int)len - 1);
577 if (r < 0)
576 if (r < 0)
578 goto bail;
577 goto bail;
579 for (i = 0; i < 2; i++) {
578 for (i = 0; i < 2; i++) {
580 if (!(revstates[parents[i] + 1] & RS_SEEN)
579 if (!(revstates[parents[i] + 1] & RS_SEEN)
581 && parents[i] >= minroot) {
580 && parents[i] >= minroot) {
582 tovisit[lentovisit++] = parents[i];
581 tovisit[lentovisit++] = parents[i];
583 revstates[parents[i] + 1] |= RS_SEEN;
582 revstates[parents[i] + 1] |= RS_SEEN;
584 }
583 }
585 }
584 }
586 }
585 }
587
586
588 /* Find all the nodes in between the roots we found and the heads
587 /* Find all the nodes in between the roots we found and the heads
589 * and add them to the reachable set */
588 * and add them to the reachable set */
590 if (includepath == 1) {
589 if (includepath == 1) {
591 long minidx = minroot;
590 long minidx = minroot;
592 if (minidx < 0)
591 if (minidx < 0)
593 minidx = 0;
592 minidx = 0;
594 for (i = minidx; i < len; i++) {
593 for (i = minidx; i < len; i++) {
595 if (!(revstates[i + 1] & RS_SEEN))
594 if (!(revstates[i + 1] & RS_SEEN))
596 continue;
595 continue;
597 r = index_get_parents(self, i, parents, (int)len - 1);
596 r = index_get_parents(self, i, parents, (int)len - 1);
598 /* Corrupted index file, error is set from
597 /* Corrupted index file, error is set from
599 * index_get_parents */
598 * index_get_parents */
600 if (r < 0)
599 if (r < 0)
601 goto bail;
600 goto bail;
602 if (((revstates[parents[0] + 1] |
601 if (((revstates[parents[0] + 1] |
603 revstates[parents[1] + 1]) & RS_REACHABLE)
602 revstates[parents[1] + 1]) & RS_REACHABLE)
604 && !(revstates[i + 1] & RS_REACHABLE)) {
603 && !(revstates[i + 1] & RS_REACHABLE)) {
605 revstates[i + 1] |= RS_REACHABLE;
604 revstates[i + 1] |= RS_REACHABLE;
606 val = PyInt_FromLong(i);
605 val = PyInt_FromLong(i);
607 if (val == NULL)
606 if (val == NULL)
608 goto bail;
607 goto bail;
609 r = PyList_Append(reachable, val);
608 r = PyList_Append(reachable, val);
610 Py_DECREF(val);
609 Py_DECREF(val);
611 if (r < 0)
610 if (r < 0)
612 goto bail;
611 goto bail;
613 }
612 }
614 }
613 }
615 }
614 }
616
615
617 free(revstates);
616 free(revstates);
618 free(tovisit);
617 free(tovisit);
619 return reachable;
618 return reachable;
620 bail:
619 bail:
621 Py_XDECREF(reachable);
620 Py_XDECREF(reachable);
622 free(revstates);
621 free(revstates);
623 free(tovisit);
622 free(tovisit);
624 return NULL;
623 return NULL;
625 }
624 }
626
625
627 static PyObject *compute_phases_map_sets(indexObject *self, PyObject *args)
626 static PyObject *compute_phases_map_sets(indexObject *self, PyObject *args)
628 {
627 {
629 PyObject *roots = Py_None;
628 PyObject *roots = Py_None;
630 PyObject *ret = NULL;
629 PyObject *ret = NULL;
631 PyObject *phaseslist = NULL;
630 PyObject *phaseslist = NULL;
632 PyObject *phaseroots = NULL;
631 PyObject *phaseroots = NULL;
633 PyObject *phaseset = NULL;
632 PyObject *phaseset = NULL;
634 PyObject *phasessetlist = NULL;
633 PyObject *phasessetlist = NULL;
635 PyObject *rev = NULL;
634 PyObject *rev = NULL;
636 Py_ssize_t len = index_length(self) - 1;
635 Py_ssize_t len = index_length(self) - 1;
637 Py_ssize_t numphase = 0;
636 Py_ssize_t numphase = 0;
638 Py_ssize_t minrevallphases = 0;
637 Py_ssize_t minrevallphases = 0;
639 Py_ssize_t minrevphase = 0;
638 Py_ssize_t minrevphase = 0;
640 Py_ssize_t i = 0;
639 Py_ssize_t i = 0;
641 char *phases = NULL;
640 char *phases = NULL;
642 long phase;
641 long phase;
643
642
644 if (!PyArg_ParseTuple(args, "O", &roots))
643 if (!PyArg_ParseTuple(args, "O", &roots))
645 goto done;
644 goto done;
646 if (roots == NULL || !PyList_Check(roots))
645 if (roots == NULL || !PyList_Check(roots))
647 goto done;
646 goto done;
648
647
649 phases = calloc(len, 1); /* phase per rev: {0: public, 1: draft, 2: secret} */
648 phases = calloc(len, 1); /* phase per rev: {0: public, 1: draft, 2: secret} */
650 if (phases == NULL) {
649 if (phases == NULL) {
651 PyErr_NoMemory();
650 PyErr_NoMemory();
652 goto done;
651 goto done;
653 }
652 }
654 /* Put the phase information of all the roots in phases */
653 /* Put the phase information of all the roots in phases */
655 numphase = PyList_GET_SIZE(roots)+1;
654 numphase = PyList_GET_SIZE(roots)+1;
656 minrevallphases = len + 1;
655 minrevallphases = len + 1;
657 phasessetlist = PyList_New(numphase);
656 phasessetlist = PyList_New(numphase);
658 if (phasessetlist == NULL)
657 if (phasessetlist == NULL)
659 goto done;
658 goto done;
660
659
661 PyList_SET_ITEM(phasessetlist, 0, Py_None);
660 PyList_SET_ITEM(phasessetlist, 0, Py_None);
662 Py_INCREF(Py_None);
661 Py_INCREF(Py_None);
663
662
664 for (i = 0; i < numphase-1; i++) {
663 for (i = 0; i < numphase-1; i++) {
665 phaseroots = PyList_GET_ITEM(roots, i);
664 phaseroots = PyList_GET_ITEM(roots, i);
666 phaseset = PySet_New(NULL);
665 phaseset = PySet_New(NULL);
667 if (phaseset == NULL)
666 if (phaseset == NULL)
668 goto release;
667 goto release;
669 PyList_SET_ITEM(phasessetlist, i+1, phaseset);
668 PyList_SET_ITEM(phasessetlist, i+1, phaseset);
670 if (!PyList_Check(phaseroots))
669 if (!PyList_Check(phaseroots))
671 goto release;
670 goto release;
672 minrevphase = add_roots_get_min(self, phaseroots, i+1, phases);
671 minrevphase = add_roots_get_min(self, phaseroots, i+1, phases);
673 if (minrevphase == -2) /* Error from add_roots_get_min */
672 if (minrevphase == -2) /* Error from add_roots_get_min */
674 goto release;
673 goto release;
675 minrevallphases = MIN(minrevallphases, minrevphase);
674 minrevallphases = MIN(minrevallphases, minrevphase);
676 }
675 }
677 /* Propagate the phase information from the roots to the revs */
676 /* Propagate the phase information from the roots to the revs */
678 if (minrevallphases != -1) {
677 if (minrevallphases != -1) {
679 int parents[2];
678 int parents[2];
680 for (i = minrevallphases; i < len; i++) {
679 for (i = minrevallphases; i < len; i++) {
681 if (index_get_parents(self, i, parents,
680 if (index_get_parents(self, i, parents,
682 (int)len - 1) < 0)
681 (int)len - 1) < 0)
683 goto release;
682 goto release;
684 set_phase_from_parents(phases, parents[0], parents[1], i);
683 set_phase_from_parents(phases, parents[0], parents[1], i);
685 }
684 }
686 }
685 }
687 /* Transform phase list to a python list */
686 /* Transform phase list to a python list */
688 phaseslist = PyList_New(len);
687 phaseslist = PyList_New(len);
689 if (phaseslist == NULL)
688 if (phaseslist == NULL)
690 goto release;
689 goto release;
691 for (i = 0; i < len; i++) {
690 for (i = 0; i < len; i++) {
692 PyObject *phaseval;
691 PyObject *phaseval;
693
692
694 phase = phases[i];
693 phase = phases[i];
695 /* We only store the sets of phase for non public phase, the public phase
694 /* We only store the sets of phase for non public phase, the public phase
696 * is computed as a difference */
695 * is computed as a difference */
697 if (phase != 0) {
696 if (phase != 0) {
698 phaseset = PyList_GET_ITEM(phasessetlist, phase);
697 phaseset = PyList_GET_ITEM(phasessetlist, phase);
699 rev = PyInt_FromLong(i);
698 rev = PyInt_FromLong(i);
700 if (rev == NULL)
699 if (rev == NULL)
701 goto release;
700 goto release;
702 PySet_Add(phaseset, rev);
701 PySet_Add(phaseset, rev);
703 Py_XDECREF(rev);
702 Py_XDECREF(rev);
704 }
703 }
705 phaseval = PyInt_FromLong(phase);
704 phaseval = PyInt_FromLong(phase);
706 if (phaseval == NULL)
705 if (phaseval == NULL)
707 goto release;
706 goto release;
708 PyList_SET_ITEM(phaseslist, i, phaseval);
707 PyList_SET_ITEM(phaseslist, i, phaseval);
709 }
708 }
710 ret = PyTuple_Pack(2, phaseslist, phasessetlist);
709 ret = PyTuple_Pack(2, phaseslist, phasessetlist);
711
710
712 release:
711 release:
713 Py_XDECREF(phaseslist);
712 Py_XDECREF(phaseslist);
714 Py_XDECREF(phasessetlist);
713 Py_XDECREF(phasessetlist);
715 done:
714 done:
716 free(phases);
715 free(phases);
717 return ret;
716 return ret;
718 }
717 }
719
718
720 static PyObject *index_headrevs(indexObject *self, PyObject *args)
719 static PyObject *index_headrevs(indexObject *self, PyObject *args)
721 {
720 {
722 Py_ssize_t i, j, len;
721 Py_ssize_t i, j, len;
723 char *nothead = NULL;
722 char *nothead = NULL;
724 PyObject *heads = NULL;
723 PyObject *heads = NULL;
725 PyObject *filter = NULL;
724 PyObject *filter = NULL;
726 PyObject *filteredrevs = Py_None;
725 PyObject *filteredrevs = Py_None;
727
726
728 if (!PyArg_ParseTuple(args, "|O", &filteredrevs)) {
727 if (!PyArg_ParseTuple(args, "|O", &filteredrevs)) {
729 return NULL;
728 return NULL;
730 }
729 }
731
730
732 if (self->headrevs && filteredrevs == self->filteredrevs)
731 if (self->headrevs && filteredrevs == self->filteredrevs)
733 return list_copy(self->headrevs);
732 return list_copy(self->headrevs);
734
733
735 Py_DECREF(self->filteredrevs);
734 Py_DECREF(self->filteredrevs);
736 self->filteredrevs = filteredrevs;
735 self->filteredrevs = filteredrevs;
737 Py_INCREF(filteredrevs);
736 Py_INCREF(filteredrevs);
738
737
739 if (filteredrevs != Py_None) {
738 if (filteredrevs != Py_None) {
740 filter = PyObject_GetAttrString(filteredrevs, "__contains__");
739 filter = PyObject_GetAttrString(filteredrevs, "__contains__");
741 if (!filter) {
740 if (!filter) {
742 PyErr_SetString(PyExc_TypeError,
741 PyErr_SetString(PyExc_TypeError,
743 "filteredrevs has no attribute __contains__");
742 "filteredrevs has no attribute __contains__");
744 goto bail;
743 goto bail;
745 }
744 }
746 }
745 }
747
746
748 len = index_length(self) - 1;
747 len = index_length(self) - 1;
749 heads = PyList_New(0);
748 heads = PyList_New(0);
750 if (heads == NULL)
749 if (heads == NULL)
751 goto bail;
750 goto bail;
752 if (len == 0) {
751 if (len == 0) {
753 PyObject *nullid = PyInt_FromLong(-1);
752 PyObject *nullid = PyInt_FromLong(-1);
754 if (nullid == NULL || PyList_Append(heads, nullid) == -1) {
753 if (nullid == NULL || PyList_Append(heads, nullid) == -1) {
755 Py_XDECREF(nullid);
754 Py_XDECREF(nullid);
756 goto bail;
755 goto bail;
757 }
756 }
758 goto done;
757 goto done;
759 }
758 }
760
759
761 nothead = calloc(len, 1);
760 nothead = calloc(len, 1);
762 if (nothead == NULL) {
761 if (nothead == NULL) {
763 PyErr_NoMemory();
762 PyErr_NoMemory();
764 goto bail;
763 goto bail;
765 }
764 }
766
765
767 for (i = len - 1; i >= 0; i--) {
766 for (i = len - 1; i >= 0; i--) {
768 int isfiltered;
767 int isfiltered;
769 int parents[2];
768 int parents[2];
770
769
771 /* If nothead[i] == 1, it means we've seen an unfiltered child of this
770 /* If nothead[i] == 1, it means we've seen an unfiltered child of this
772 * node already, and therefore this node is not filtered. So we can skip
771 * node already, and therefore this node is not filtered. So we can skip
773 * the expensive check_filter step.
772 * the expensive check_filter step.
774 */
773 */
775 if (nothead[i] != 1) {
774 if (nothead[i] != 1) {
776 isfiltered = check_filter(filter, i);
775 isfiltered = check_filter(filter, i);
777 if (isfiltered == -1) {
776 if (isfiltered == -1) {
778 PyErr_SetString(PyExc_TypeError,
777 PyErr_SetString(PyExc_TypeError,
779 "unable to check filter");
778 "unable to check filter");
780 goto bail;
779 goto bail;
781 }
780 }
782
781
783 if (isfiltered) {
782 if (isfiltered) {
784 nothead[i] = 1;
783 nothead[i] = 1;
785 continue;
784 continue;
786 }
785 }
787 }
786 }
788
787
789 if (index_get_parents(self, i, parents, (int)len - 1) < 0)
788 if (index_get_parents(self, i, parents, (int)len - 1) < 0)
790 goto bail;
789 goto bail;
791 for (j = 0; j < 2; j++) {
790 for (j = 0; j < 2; j++) {
792 if (parents[j] >= 0)
791 if (parents[j] >= 0)
793 nothead[parents[j]] = 1;
792 nothead[parents[j]] = 1;
794 }
793 }
795 }
794 }
796
795
797 for (i = 0; i < len; i++) {
796 for (i = 0; i < len; i++) {
798 PyObject *head;
797 PyObject *head;
799
798
800 if (nothead[i])
799 if (nothead[i])
801 continue;
800 continue;
802 head = PyInt_FromSsize_t(i);
801 head = PyInt_FromSsize_t(i);
803 if (head == NULL || PyList_Append(heads, head) == -1) {
802 if (head == NULL || PyList_Append(heads, head) == -1) {
804 Py_XDECREF(head);
803 Py_XDECREF(head);
805 goto bail;
804 goto bail;
806 }
805 }
807 }
806 }
808
807
809 done:
808 done:
810 self->headrevs = heads;
809 self->headrevs = heads;
811 Py_XDECREF(filter);
810 Py_XDECREF(filter);
812 free(nothead);
811 free(nothead);
813 return list_copy(self->headrevs);
812 return list_copy(self->headrevs);
814 bail:
813 bail:
815 Py_XDECREF(filter);
814 Py_XDECREF(filter);
816 Py_XDECREF(heads);
815 Py_XDECREF(heads);
817 free(nothead);
816 free(nothead);
818 return NULL;
817 return NULL;
819 }
818 }
820
819
821 /**
820 /**
822 * Obtain the base revision index entry.
821 * Obtain the base revision index entry.
823 *
822 *
824 * Callers must ensure that rev >= 0 or illegal memory access may occur.
823 * Callers must ensure that rev >= 0 or illegal memory access may occur.
825 */
824 */
826 static inline int index_baserev(indexObject *self, int rev)
825 static inline int index_baserev(indexObject *self, int rev)
827 {
826 {
828 const char *data;
827 const char *data;
829
828
830 if (rev >= self->length - 1) {
829 if (rev >= self->length - 1) {
831 PyObject *tuple = PyList_GET_ITEM(self->added,
830 PyObject *tuple = PyList_GET_ITEM(self->added,
832 rev - self->length + 1);
831 rev - self->length + 1);
833 return (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 3));
832 return (int)PyInt_AS_LONG(PyTuple_GET_ITEM(tuple, 3));
834 }
833 }
835 else {
834 else {
836 data = index_deref(self, rev);
835 data = index_deref(self, rev);
837 if (data == NULL) {
836 if (data == NULL) {
838 return -2;
837 return -2;
839 }
838 }
840
839
841 return getbe32(data + 16);
840 return getbe32(data + 16);
842 }
841 }
843 }
842 }
844
843
845 static PyObject *index_deltachain(indexObject *self, PyObject *args)
844 static PyObject *index_deltachain(indexObject *self, PyObject *args)
846 {
845 {
847 int rev, generaldelta;
846 int rev, generaldelta;
848 PyObject *stoparg;
847 PyObject *stoparg;
849 int stoprev, iterrev, baserev = -1;
848 int stoprev, iterrev, baserev = -1;
850 int stopped;
849 int stopped;
851 PyObject *chain = NULL, *result = NULL;
850 PyObject *chain = NULL, *result = NULL;
852 const Py_ssize_t length = index_length(self);
851 const Py_ssize_t length = index_length(self);
853
852
854 if (!PyArg_ParseTuple(args, "iOi", &rev, &stoparg, &generaldelta)) {
853 if (!PyArg_ParseTuple(args, "iOi", &rev, &stoparg, &generaldelta)) {
855 return NULL;
854 return NULL;
856 }
855 }
857
856
858 if (PyInt_Check(stoparg)) {
857 if (PyInt_Check(stoparg)) {
859 stoprev = (int)PyInt_AsLong(stoparg);
858 stoprev = (int)PyInt_AsLong(stoparg);
860 if (stoprev == -1 && PyErr_Occurred()) {
859 if (stoprev == -1 && PyErr_Occurred()) {
861 return NULL;
860 return NULL;
862 }
861 }
863 }
862 }
864 else if (stoparg == Py_None) {
863 else if (stoparg == Py_None) {
865 stoprev = -2;
864 stoprev = -2;
866 }
865 }
867 else {
866 else {
868 PyErr_SetString(PyExc_ValueError,
867 PyErr_SetString(PyExc_ValueError,
869 "stoprev must be integer or None");
868 "stoprev must be integer or None");
870 return NULL;
869 return NULL;
871 }
870 }
872
871
873 if (rev < 0 || rev >= length - 1) {
872 if (rev < 0 || rev >= length - 1) {
874 PyErr_SetString(PyExc_ValueError, "revlog index out of range");
873 PyErr_SetString(PyExc_ValueError, "revlog index out of range");
875 return NULL;
874 return NULL;
876 }
875 }
877
876
878 chain = PyList_New(0);
877 chain = PyList_New(0);
879 if (chain == NULL) {
878 if (chain == NULL) {
880 return NULL;
879 return NULL;
881 }
880 }
882
881
883 baserev = index_baserev(self, rev);
882 baserev = index_baserev(self, rev);
884
883
885 /* This should never happen. */
884 /* This should never happen. */
886 if (baserev <= -2) {
885 if (baserev <= -2) {
887 /* Error should be set by index_deref() */
886 /* Error should be set by index_deref() */
888 assert(PyErr_Occurred());
887 assert(PyErr_Occurred());
889 goto bail;
888 goto bail;
890 }
889 }
891
890
892 iterrev = rev;
891 iterrev = rev;
893
892
894 while (iterrev != baserev && iterrev != stoprev) {
893 while (iterrev != baserev && iterrev != stoprev) {
895 PyObject *value = PyInt_FromLong(iterrev);
894 PyObject *value = PyInt_FromLong(iterrev);
896 if (value == NULL) {
895 if (value == NULL) {
897 goto bail;
896 goto bail;
898 }
897 }
899 if (PyList_Append(chain, value)) {
898 if (PyList_Append(chain, value)) {
900 Py_DECREF(value);
899 Py_DECREF(value);
901 goto bail;
900 goto bail;
902 }
901 }
903 Py_DECREF(value);
902 Py_DECREF(value);
904
903
905 if (generaldelta) {
904 if (generaldelta) {
906 iterrev = baserev;
905 iterrev = baserev;
907 }
906 }
908 else {
907 else {
909 iterrev--;
908 iterrev--;
910 }
909 }
911
910
912 if (iterrev < 0) {
911 if (iterrev < 0) {
913 break;
912 break;
914 }
913 }
915
914
916 if (iterrev >= length - 1) {
915 if (iterrev >= length - 1) {
917 PyErr_SetString(PyExc_IndexError, "revision outside index");
916 PyErr_SetString(PyExc_IndexError, "revision outside index");
918 return NULL;
917 return NULL;
919 }
918 }
920
919
921 baserev = index_baserev(self, iterrev);
920 baserev = index_baserev(self, iterrev);
922
921
923 /* This should never happen. */
922 /* This should never happen. */
924 if (baserev <= -2) {
923 if (baserev <= -2) {
925 /* Error should be set by index_deref() */
924 /* Error should be set by index_deref() */
926 assert(PyErr_Occurred());
925 assert(PyErr_Occurred());
927 goto bail;
926 goto bail;
928 }
927 }
929 }
928 }
930
929
931 if (iterrev == stoprev) {
930 if (iterrev == stoprev) {
932 stopped = 1;
931 stopped = 1;
933 }
932 }
934 else {
933 else {
935 PyObject *value = PyInt_FromLong(iterrev);
934 PyObject *value = PyInt_FromLong(iterrev);
936 if (value == NULL) {
935 if (value == NULL) {
937 goto bail;
936 goto bail;
938 }
937 }
939 if (PyList_Append(chain, value)) {
938 if (PyList_Append(chain, value)) {
940 Py_DECREF(value);
939 Py_DECREF(value);
941 goto bail;
940 goto bail;
942 }
941 }
943 Py_DECREF(value);
942 Py_DECREF(value);
944
943
945 stopped = 0;
944 stopped = 0;
946 }
945 }
947
946
948 if (PyList_Reverse(chain)) {
947 if (PyList_Reverse(chain)) {
949 goto bail;
948 goto bail;
950 }
949 }
951
950
952 result = Py_BuildValue("OO", chain, stopped ? Py_True : Py_False);
951 result = Py_BuildValue("OO", chain, stopped ? Py_True : Py_False);
953 Py_DECREF(chain);
952 Py_DECREF(chain);
954 return result;
953 return result;
955
954
956 bail:
955 bail:
957 Py_DECREF(chain);
956 Py_DECREF(chain);
958 return NULL;
957 return NULL;
959 }
958 }
960
959
961 static inline int nt_level(const char *node, Py_ssize_t level)
960 static inline int nt_level(const char *node, Py_ssize_t level)
962 {
961 {
963 int v = node[level>>1];
962 int v = node[level>>1];
964 if (!(level & 1))
963 if (!(level & 1))
965 v >>= 4;
964 v >>= 4;
966 return v & 0xf;
965 return v & 0xf;
967 }
966 }
968
967
969 /*
968 /*
970 * Return values:
969 * Return values:
971 *
970 *
972 * -4: match is ambiguous (multiple candidates)
971 * -4: match is ambiguous (multiple candidates)
973 * -2: not found
972 * -2: not found
974 * rest: valid rev
973 * rest: valid rev
975 */
974 */
976 static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
975 static int nt_find(indexObject *self, const char *node, Py_ssize_t nodelen,
977 int hex)
976 int hex)
978 {
977 {
979 int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
978 int (*getnybble)(const char *, Py_ssize_t) = hex ? hexdigit : nt_level;
980 int level, maxlevel, off;
979 int level, maxlevel, off;
981
980
982 if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
981 if (nodelen == 20 && node[0] == '\0' && memcmp(node, nullid, 20) == 0)
983 return -1;
982 return -1;
984
983
985 if (self->nt == NULL)
984 if (self->nt == NULL)
986 return -2;
985 return -2;
987
986
988 if (hex)
987 if (hex)
989 maxlevel = nodelen > 40 ? 40 : (int)nodelen;
988 maxlevel = nodelen > 40 ? 40 : (int)nodelen;
990 else
989 else
991 maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
990 maxlevel = nodelen > 20 ? 40 : ((int)nodelen * 2);
992
991
993 for (level = off = 0; level < maxlevel; level++) {
992 for (level = off = 0; level < maxlevel; level++) {
994 int k = getnybble(node, level);
993 int k = getnybble(node, level);
995 nodetree *n = &self->nt[off];
994 nodetree *n = &self->nt[off];
996 int v = n->children[k];
995 int v = n->children[k];
997
996
998 if (v < 0) {
997 if (v < 0) {
999 const char *n;
998 const char *n;
1000 Py_ssize_t i;
999 Py_ssize_t i;
1001
1000
1002 v = -(v + 1);
1001 v = -(v + 1);
1003 n = index_node(self, v);
1002 n = index_node(self, v);
1004 if (n == NULL)
1003 if (n == NULL)
1005 return -2;
1004 return -2;
1006 for (i = level; i < maxlevel; i++)
1005 for (i = level; i < maxlevel; i++)
1007 if (getnybble(node, i) != nt_level(n, i))
1006 if (getnybble(node, i) != nt_level(n, i))
1008 return -2;
1007 return -2;
1009 return v;
1008 return v;
1010 }
1009 }
1011 if (v == 0)
1010 if (v == 0)
1012 return -2;
1011 return -2;
1013 off = v;
1012 off = v;
1014 }
1013 }
1015 /* multiple matches against an ambiguous prefix */
1014 /* multiple matches against an ambiguous prefix */
1016 return -4;
1015 return -4;
1017 }
1016 }
1018
1017
1019 static int nt_new(indexObject *self)
1018 static int nt_new(indexObject *self)
1020 {
1019 {
1021 if (self->ntlength == self->ntcapacity) {
1020 if (self->ntlength == self->ntcapacity) {
1022 if (self->ntcapacity >= INT_MAX / (sizeof(nodetree) * 2)) {
1021 if (self->ntcapacity >= INT_MAX / (sizeof(nodetree) * 2)) {
1023 PyErr_SetString(PyExc_MemoryError,
1022 PyErr_SetString(PyExc_MemoryError,
1024 "overflow in nt_new");
1023 "overflow in nt_new");
1025 return -1;
1024 return -1;
1026 }
1025 }
1027 self->ntcapacity *= 2;
1026 self->ntcapacity *= 2;
1028 self->nt = realloc(self->nt,
1027 self->nt = realloc(self->nt,
1029 self->ntcapacity * sizeof(nodetree));
1028 self->ntcapacity * sizeof(nodetree));
1030 if (self->nt == NULL) {
1029 if (self->nt == NULL) {
1031 PyErr_SetString(PyExc_MemoryError, "out of memory");
1030 PyErr_SetString(PyExc_MemoryError, "out of memory");
1032 return -1;
1031 return -1;
1033 }
1032 }
1034 memset(&self->nt[self->ntlength], 0,
1033 memset(&self->nt[self->ntlength], 0,
1035 sizeof(nodetree) * (self->ntcapacity - self->ntlength));
1034 sizeof(nodetree) * (self->ntcapacity - self->ntlength));
1036 }
1035 }
1037 return self->ntlength++;
1036 return self->ntlength++;
1038 }
1037 }
1039
1038
1040 static int nt_insert(indexObject *self, const char *node, int rev)
1039 static int nt_insert(indexObject *self, const char *node, int rev)
1041 {
1040 {
1042 int level = 0;
1041 int level = 0;
1043 int off = 0;
1042 int off = 0;
1044
1043
1045 while (level < 40) {
1044 while (level < 40) {
1046 int k = nt_level(node, level);
1045 int k = nt_level(node, level);
1047 nodetree *n;
1046 nodetree *n;
1048 int v;
1047 int v;
1049
1048
1050 n = &self->nt[off];
1049 n = &self->nt[off];
1051 v = n->children[k];
1050 v = n->children[k];
1052
1051
1053 if (v == 0) {
1052 if (v == 0) {
1054 n->children[k] = -rev - 1;
1053 n->children[k] = -rev - 1;
1055 return 0;
1054 return 0;
1056 }
1055 }
1057 if (v < 0) {
1056 if (v < 0) {
1058 const char *oldnode = index_node(self, -(v + 1));
1057 const char *oldnode = index_node(self, -(v + 1));
1059 int noff;
1058 int noff;
1060
1059
1061 if (!oldnode || !memcmp(oldnode, node, 20)) {
1060 if (!oldnode || !memcmp(oldnode, node, 20)) {
1062 n->children[k] = -rev - 1;
1061 n->children[k] = -rev - 1;
1063 return 0;
1062 return 0;
1064 }
1063 }
1065 noff = nt_new(self);
1064 noff = nt_new(self);
1066 if (noff == -1)
1065 if (noff == -1)
1067 return -1;
1066 return -1;
1068 /* self->nt may have been changed by realloc */
1067 /* self->nt may have been changed by realloc */
1069 self->nt[off].children[k] = noff;
1068 self->nt[off].children[k] = noff;
1070 off = noff;
1069 off = noff;
1071 n = &self->nt[off];
1070 n = &self->nt[off];
1072 n->children[nt_level(oldnode, ++level)] = v;
1071 n->children[nt_level(oldnode, ++level)] = v;
1073 if (level > self->ntdepth)
1072 if (level > self->ntdepth)
1074 self->ntdepth = level;
1073 self->ntdepth = level;
1075 self->ntsplits += 1;
1074 self->ntsplits += 1;
1076 } else {
1075 } else {
1077 level += 1;
1076 level += 1;
1078 off = v;
1077 off = v;
1079 }
1078 }
1080 }
1079 }
1081
1080
1082 return -1;
1081 return -1;
1083 }
1082 }
1084
1083
1085 static int nt_init(indexObject *self)
1084 static int nt_init(indexObject *self)
1086 {
1085 {
1087 if (self->nt == NULL) {
1086 if (self->nt == NULL) {
1088 if ((size_t)self->raw_length > INT_MAX / sizeof(nodetree)) {
1087 if ((size_t)self->raw_length > INT_MAX / sizeof(nodetree)) {
1089 PyErr_SetString(PyExc_ValueError, "overflow in nt_init");
1088 PyErr_SetString(PyExc_ValueError, "overflow in nt_init");
1090 return -1;
1089 return -1;
1091 }
1090 }
1092 self->ntcapacity = self->raw_length < 4
1091 self->ntcapacity = self->raw_length < 4
1093 ? 4 : (int)self->raw_length / 2;
1092 ? 4 : (int)self->raw_length / 2;
1094
1093
1095 self->nt = calloc(self->ntcapacity, sizeof(nodetree));
1094 self->nt = calloc(self->ntcapacity, sizeof(nodetree));
1096 if (self->nt == NULL) {
1095 if (self->nt == NULL) {
1097 PyErr_NoMemory();
1096 PyErr_NoMemory();
1098 return -1;
1097 return -1;
1099 }
1098 }
1100 self->ntlength = 1;
1099 self->ntlength = 1;
1101 self->ntrev = (int)index_length(self) - 1;
1100 self->ntrev = (int)index_length(self) - 1;
1102 self->ntlookups = 1;
1101 self->ntlookups = 1;
1103 self->ntmisses = 0;
1102 self->ntmisses = 0;
1104 if (nt_insert(self, nullid, INT_MAX) == -1)
1103 if (nt_insert(self, nullid, INT_MAX) == -1)
1105 return -1;
1104 return -1;
1106 }
1105 }
1107 return 0;
1106 return 0;
1108 }
1107 }
1109
1108
1110 /*
1109 /*
1111 * Return values:
1110 * Return values:
1112 *
1111 *
1113 * -3: error (exception set)
1112 * -3: error (exception set)
1114 * -2: not found (no exception set)
1113 * -2: not found (no exception set)
1115 * rest: valid rev
1114 * rest: valid rev
1116 */
1115 */
1117 static int index_find_node(indexObject *self,
1116 static int index_find_node(indexObject *self,
1118 const char *node, Py_ssize_t nodelen)
1117 const char *node, Py_ssize_t nodelen)
1119 {
1118 {
1120 int rev;
1119 int rev;
1121
1120
1122 self->ntlookups++;
1121 self->ntlookups++;
1123 rev = nt_find(self, node, nodelen, 0);
1122 rev = nt_find(self, node, nodelen, 0);
1124 if (rev >= -1)
1123 if (rev >= -1)
1125 return rev;
1124 return rev;
1126
1125
1127 if (nt_init(self) == -1)
1126 if (nt_init(self) == -1)
1128 return -3;
1127 return -3;
1129
1128
1130 /*
1129 /*
1131 * For the first handful of lookups, we scan the entire index,
1130 * For the first handful of lookups, we scan the entire index,
1132 * and cache only the matching nodes. This optimizes for cases
1131 * and cache only the matching nodes. This optimizes for cases
1133 * like "hg tip", where only a few nodes are accessed.
1132 * like "hg tip", where only a few nodes are accessed.
1134 *
1133 *
1135 * After that, we cache every node we visit, using a single
1134 * After that, we cache every node we visit, using a single
1136 * scan amortized over multiple lookups. This gives the best
1135 * scan amortized over multiple lookups. This gives the best
1137 * bulk performance, e.g. for "hg log".
1136 * bulk performance, e.g. for "hg log".
1138 */
1137 */
1139 if (self->ntmisses++ < 4) {
1138 if (self->ntmisses++ < 4) {
1140 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1139 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1141 const char *n = index_node(self, rev);
1140 const char *n = index_node(self, rev);
1142 if (n == NULL)
1141 if (n == NULL)
1143 return -2;
1142 return -2;
1144 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1143 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1145 if (nt_insert(self, n, rev) == -1)
1144 if (nt_insert(self, n, rev) == -1)
1146 return -3;
1145 return -3;
1147 break;
1146 break;
1148 }
1147 }
1149 }
1148 }
1150 } else {
1149 } else {
1151 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1150 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1152 const char *n = index_node(self, rev);
1151 const char *n = index_node(self, rev);
1153 if (n == NULL) {
1152 if (n == NULL) {
1154 self->ntrev = rev + 1;
1153 self->ntrev = rev + 1;
1155 return -2;
1154 return -2;
1156 }
1155 }
1157 if (nt_insert(self, n, rev) == -1) {
1156 if (nt_insert(self, n, rev) == -1) {
1158 self->ntrev = rev + 1;
1157 self->ntrev = rev + 1;
1159 return -3;
1158 return -3;
1160 }
1159 }
1161 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1160 if (memcmp(node, n, nodelen > 20 ? 20 : nodelen) == 0) {
1162 break;
1161 break;
1163 }
1162 }
1164 }
1163 }
1165 self->ntrev = rev;
1164 self->ntrev = rev;
1166 }
1165 }
1167
1166
1168 if (rev >= 0)
1167 if (rev >= 0)
1169 return rev;
1168 return rev;
1170 return -2;
1169 return -2;
1171 }
1170 }
1172
1171
1173 static void raise_revlog_error(void)
1172 static void raise_revlog_error(void)
1174 {
1173 {
1175 PyObject *mod = NULL, *dict = NULL, *errclass = NULL;
1174 PyObject *mod = NULL, *dict = NULL, *errclass = NULL;
1176
1175
1177 mod = PyImport_ImportModule("mercurial.error");
1176 mod = PyImport_ImportModule("mercurial.error");
1178 if (mod == NULL) {
1177 if (mod == NULL) {
1179 goto cleanup;
1178 goto cleanup;
1180 }
1179 }
1181
1180
1182 dict = PyModule_GetDict(mod);
1181 dict = PyModule_GetDict(mod);
1183 if (dict == NULL) {
1182 if (dict == NULL) {
1184 goto cleanup;
1183 goto cleanup;
1185 }
1184 }
1186 Py_INCREF(dict);
1185 Py_INCREF(dict);
1187
1186
1188 errclass = PyDict_GetItemString(dict, "RevlogError");
1187 errclass = PyDict_GetItemString(dict, "RevlogError");
1189 if (errclass == NULL) {
1188 if (errclass == NULL) {
1190 PyErr_SetString(PyExc_SystemError,
1189 PyErr_SetString(PyExc_SystemError,
1191 "could not find RevlogError");
1190 "could not find RevlogError");
1192 goto cleanup;
1191 goto cleanup;
1193 }
1192 }
1194
1193
1195 /* value of exception is ignored by callers */
1194 /* value of exception is ignored by callers */
1196 PyErr_SetString(errclass, "RevlogError");
1195 PyErr_SetString(errclass, "RevlogError");
1197
1196
1198 cleanup:
1197 cleanup:
1199 Py_XDECREF(dict);
1198 Py_XDECREF(dict);
1200 Py_XDECREF(mod);
1199 Py_XDECREF(mod);
1201 }
1200 }
1202
1201
1203 static PyObject *index_getitem(indexObject *self, PyObject *value)
1202 static PyObject *index_getitem(indexObject *self, PyObject *value)
1204 {
1203 {
1205 char *node;
1204 char *node;
1206 Py_ssize_t nodelen;
1205 Py_ssize_t nodelen;
1207 int rev;
1206 int rev;
1208
1207
1209 if (PyInt_Check(value))
1208 if (PyInt_Check(value))
1210 return index_get(self, PyInt_AS_LONG(value));
1209 return index_get(self, PyInt_AS_LONG(value));
1211
1210
1212 if (node_check(value, &node, &nodelen) == -1)
1211 if (node_check(value, &node, &nodelen) == -1)
1213 return NULL;
1212 return NULL;
1214 rev = index_find_node(self, node, nodelen);
1213 rev = index_find_node(self, node, nodelen);
1215 if (rev >= -1)
1214 if (rev >= -1)
1216 return PyInt_FromLong(rev);
1215 return PyInt_FromLong(rev);
1217 if (rev == -2)
1216 if (rev == -2)
1218 raise_revlog_error();
1217 raise_revlog_error();
1219 return NULL;
1218 return NULL;
1220 }
1219 }
1221
1220
1222 static int nt_partialmatch(indexObject *self, const char *node,
1221 static int nt_partialmatch(indexObject *self, const char *node,
1223 Py_ssize_t nodelen)
1222 Py_ssize_t nodelen)
1224 {
1223 {
1225 int rev;
1224 int rev;
1226
1225
1227 if (nt_init(self) == -1)
1226 if (nt_init(self) == -1)
1228 return -3;
1227 return -3;
1229
1228
1230 if (self->ntrev > 0) {
1229 if (self->ntrev > 0) {
1231 /* ensure that the radix tree is fully populated */
1230 /* ensure that the radix tree is fully populated */
1232 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1231 for (rev = self->ntrev - 1; rev >= 0; rev--) {
1233 const char *n = index_node(self, rev);
1232 const char *n = index_node(self, rev);
1234 if (n == NULL)
1233 if (n == NULL)
1235 return -2;
1234 return -2;
1236 if (nt_insert(self, n, rev) == -1)
1235 if (nt_insert(self, n, rev) == -1)
1237 return -3;
1236 return -3;
1238 }
1237 }
1239 self->ntrev = rev;
1238 self->ntrev = rev;
1240 }
1239 }
1241
1240
1242 return nt_find(self, node, nodelen, 1);
1241 return nt_find(self, node, nodelen, 1);
1243 }
1242 }
1244
1243
1245 static PyObject *index_partialmatch(indexObject *self, PyObject *args)
1244 static PyObject *index_partialmatch(indexObject *self, PyObject *args)
1246 {
1245 {
1247 const char *fullnode;
1246 const char *fullnode;
1248 int nodelen;
1247 int nodelen;
1249 char *node;
1248 char *node;
1250 int rev, i;
1249 int rev, i;
1251
1250
1252 if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
1251 if (!PyArg_ParseTuple(args, "s#", &node, &nodelen))
1253 return NULL;
1252 return NULL;
1254
1253
1255 if (nodelen < 4) {
1254 if (nodelen < 4) {
1256 PyErr_SetString(PyExc_ValueError, "key too short");
1255 PyErr_SetString(PyExc_ValueError, "key too short");
1257 return NULL;
1256 return NULL;
1258 }
1257 }
1259
1258
1260 if (nodelen > 40) {
1259 if (nodelen > 40) {
1261 PyErr_SetString(PyExc_ValueError, "key too long");
1260 PyErr_SetString(PyExc_ValueError, "key too long");
1262 return NULL;
1261 return NULL;
1263 }
1262 }
1264
1263
1265 for (i = 0; i < nodelen; i++)
1264 for (i = 0; i < nodelen; i++)
1266 hexdigit(node, i);
1265 hexdigit(node, i);
1267 if (PyErr_Occurred()) {
1266 if (PyErr_Occurred()) {
1268 /* input contains non-hex characters */
1267 /* input contains non-hex characters */
1269 PyErr_Clear();
1268 PyErr_Clear();
1270 Py_RETURN_NONE;
1269 Py_RETURN_NONE;
1271 }
1270 }
1272
1271
1273 rev = nt_partialmatch(self, node, nodelen);
1272 rev = nt_partialmatch(self, node, nodelen);
1274
1273
1275 switch (rev) {
1274 switch (rev) {
1276 case -4:
1275 case -4:
1277 raise_revlog_error();
1276 raise_revlog_error();
1278 case -3:
1277 case -3:
1279 return NULL;
1278 return NULL;
1280 case -2:
1279 case -2:
1281 Py_RETURN_NONE;
1280 Py_RETURN_NONE;
1282 case -1:
1281 case -1:
1283 return PyBytes_FromStringAndSize(nullid, 20);
1282 return PyBytes_FromStringAndSize(nullid, 20);
1284 }
1283 }
1285
1284
1286 fullnode = index_node(self, rev);
1285 fullnode = index_node(self, rev);
1287 if (fullnode == NULL) {
1286 if (fullnode == NULL) {
1288 PyErr_Format(PyExc_IndexError,
1287 PyErr_Format(PyExc_IndexError,
1289 "could not access rev %d", rev);
1288 "could not access rev %d", rev);
1290 return NULL;
1289 return NULL;
1291 }
1290 }
1292 return PyBytes_FromStringAndSize(fullnode, 20);
1291 return PyBytes_FromStringAndSize(fullnode, 20);
1293 }
1292 }
1294
1293
1295 static PyObject *index_m_get(indexObject *self, PyObject *args)
1294 static PyObject *index_m_get(indexObject *self, PyObject *args)
1296 {
1295 {
1297 Py_ssize_t nodelen;
1296 Py_ssize_t nodelen;
1298 PyObject *val;
1297 PyObject *val;
1299 char *node;
1298 char *node;
1300 int rev;
1299 int rev;
1301
1300
1302 if (!PyArg_ParseTuple(args, "O", &val))
1301 if (!PyArg_ParseTuple(args, "O", &val))
1303 return NULL;
1302 return NULL;
1304 if (node_check(val, &node, &nodelen) == -1)
1303 if (node_check(val, &node, &nodelen) == -1)
1305 return NULL;
1304 return NULL;
1306 rev = index_find_node(self, node, nodelen);
1305 rev = index_find_node(self, node, nodelen);
1307 if (rev == -3)
1306 if (rev == -3)
1308 return NULL;
1307 return NULL;
1309 if (rev == -2)
1308 if (rev == -2)
1310 Py_RETURN_NONE;
1309 Py_RETURN_NONE;
1311 return PyInt_FromLong(rev);
1310 return PyInt_FromLong(rev);
1312 }
1311 }
1313
1312
1314 static int index_contains(indexObject *self, PyObject *value)
1313 static int index_contains(indexObject *self, PyObject *value)
1315 {
1314 {
1316 char *node;
1315 char *node;
1317 Py_ssize_t nodelen;
1316 Py_ssize_t nodelen;
1318
1317
1319 if (PyInt_Check(value)) {
1318 if (PyInt_Check(value)) {
1320 long rev = PyInt_AS_LONG(value);
1319 long rev = PyInt_AS_LONG(value);
1321 return rev >= -1 && rev < index_length(self);
1320 return rev >= -1 && rev < index_length(self);
1322 }
1321 }
1323
1322
1324 if (node_check(value, &node, &nodelen) == -1)
1323 if (node_check(value, &node, &nodelen) == -1)
1325 return -1;
1324 return -1;
1326
1325
1327 switch (index_find_node(self, node, nodelen)) {
1326 switch (index_find_node(self, node, nodelen)) {
1328 case -3:
1327 case -3:
1329 return -1;
1328 return -1;
1330 case -2:
1329 case -2:
1331 return 0;
1330 return 0;
1332 default:
1331 default:
1333 return 1;
1332 return 1;
1334 }
1333 }
1335 }
1334 }
1336
1335
1337 typedef uint64_t bitmask;
1336 typedef uint64_t bitmask;
1338
1337
1339 /*
1338 /*
1340 * Given a disjoint set of revs, return all candidates for the
1339 * Given a disjoint set of revs, return all candidates for the
1341 * greatest common ancestor. In revset notation, this is the set
1340 * greatest common ancestor. In revset notation, this is the set
1342 * "heads(::a and ::b and ...)"
1341 * "heads(::a and ::b and ...)"
1343 */
1342 */
1344 static PyObject *find_gca_candidates(indexObject *self, const int *revs,
1343 static PyObject *find_gca_candidates(indexObject *self, const int *revs,
1345 int revcount)
1344 int revcount)
1346 {
1345 {
1347 const bitmask allseen = (1ull << revcount) - 1;
1346 const bitmask allseen = (1ull << revcount) - 1;
1348 const bitmask poison = 1ull << revcount;
1347 const bitmask poison = 1ull << revcount;
1349 PyObject *gca = PyList_New(0);
1348 PyObject *gca = PyList_New(0);
1350 int i, v, interesting;
1349 int i, v, interesting;
1351 int maxrev = -1;
1350 int maxrev = -1;
1352 bitmask sp;
1351 bitmask sp;
1353 bitmask *seen;
1352 bitmask *seen;
1354
1353
1355 if (gca == NULL)
1354 if (gca == NULL)
1356 return PyErr_NoMemory();
1355 return PyErr_NoMemory();
1357
1356
1358 for (i = 0; i < revcount; i++) {
1357 for (i = 0; i < revcount; i++) {
1359 if (revs[i] > maxrev)
1358 if (revs[i] > maxrev)
1360 maxrev = revs[i];
1359 maxrev = revs[i];
1361 }
1360 }
1362
1361
1363 seen = calloc(sizeof(*seen), maxrev + 1);
1362 seen = calloc(sizeof(*seen), maxrev + 1);
1364 if (seen == NULL) {
1363 if (seen == NULL) {
1365 Py_DECREF(gca);
1364 Py_DECREF(gca);
1366 return PyErr_NoMemory();
1365 return PyErr_NoMemory();
1367 }
1366 }
1368
1367
1369 for (i = 0; i < revcount; i++)
1368 for (i = 0; i < revcount; i++)
1370 seen[revs[i]] = 1ull << i;
1369 seen[revs[i]] = 1ull << i;
1371
1370
1372 interesting = revcount;
1371 interesting = revcount;
1373
1372
1374 for (v = maxrev; v >= 0 && interesting; v--) {
1373 for (v = maxrev; v >= 0 && interesting; v--) {
1375 bitmask sv = seen[v];
1374 bitmask sv = seen[v];
1376 int parents[2];
1375 int parents[2];
1377
1376
1378 if (!sv)
1377 if (!sv)
1379 continue;
1378 continue;
1380
1379
1381 if (sv < poison) {
1380 if (sv < poison) {
1382 interesting -= 1;
1381 interesting -= 1;
1383 if (sv == allseen) {
1382 if (sv == allseen) {
1384 PyObject *obj = PyInt_FromLong(v);
1383 PyObject *obj = PyInt_FromLong(v);
1385 if (obj == NULL)
1384 if (obj == NULL)
1386 goto bail;
1385 goto bail;
1387 if (PyList_Append(gca, obj) == -1) {
1386 if (PyList_Append(gca, obj) == -1) {
1388 Py_DECREF(obj);
1387 Py_DECREF(obj);
1389 goto bail;
1388 goto bail;
1390 }
1389 }
1391 sv |= poison;
1390 sv |= poison;
1392 for (i = 0; i < revcount; i++) {
1391 for (i = 0; i < revcount; i++) {
1393 if (revs[i] == v)
1392 if (revs[i] == v)
1394 goto done;
1393 goto done;
1395 }
1394 }
1396 }
1395 }
1397 }
1396 }
1398 if (index_get_parents(self, v, parents, maxrev) < 0)
1397 if (index_get_parents(self, v, parents, maxrev) < 0)
1399 goto bail;
1398 goto bail;
1400
1399
1401 for (i = 0; i < 2; i++) {
1400 for (i = 0; i < 2; i++) {
1402 int p = parents[i];
1401 int p = parents[i];
1403 if (p == -1)
1402 if (p == -1)
1404 continue;
1403 continue;
1405 sp = seen[p];
1404 sp = seen[p];
1406 if (sv < poison) {
1405 if (sv < poison) {
1407 if (sp == 0) {
1406 if (sp == 0) {
1408 seen[p] = sv;
1407 seen[p] = sv;
1409 interesting++;
1408 interesting++;
1410 }
1409 }
1411 else if (sp != sv)
1410 else if (sp != sv)
1412 seen[p] |= sv;
1411 seen[p] |= sv;
1413 } else {
1412 } else {
1414 if (sp && sp < poison)
1413 if (sp && sp < poison)
1415 interesting--;
1414 interesting--;
1416 seen[p] = sv;
1415 seen[p] = sv;
1417 }
1416 }
1418 }
1417 }
1419 }
1418 }
1420
1419
1421 done:
1420 done:
1422 free(seen);
1421 free(seen);
1423 return gca;
1422 return gca;
1424 bail:
1423 bail:
1425 free(seen);
1424 free(seen);
1426 Py_XDECREF(gca);
1425 Py_XDECREF(gca);
1427 return NULL;
1426 return NULL;
1428 }
1427 }
1429
1428
1430 /*
1429 /*
1431 * Given a disjoint set of revs, return the subset with the longest
1430 * Given a disjoint set of revs, return the subset with the longest
1432 * path to the root.
1431 * path to the root.
1433 */
1432 */
1434 static PyObject *find_deepest(indexObject *self, PyObject *revs)
1433 static PyObject *find_deepest(indexObject *self, PyObject *revs)
1435 {
1434 {
1436 const Py_ssize_t revcount = PyList_GET_SIZE(revs);
1435 const Py_ssize_t revcount = PyList_GET_SIZE(revs);
1437 static const Py_ssize_t capacity = 24;
1436 static const Py_ssize_t capacity = 24;
1438 int *depth, *interesting = NULL;
1437 int *depth, *interesting = NULL;
1439 int i, j, v, ninteresting;
1438 int i, j, v, ninteresting;
1440 PyObject *dict = NULL, *keys = NULL;
1439 PyObject *dict = NULL, *keys = NULL;
1441 long *seen = NULL;
1440 long *seen = NULL;
1442 int maxrev = -1;
1441 int maxrev = -1;
1443 long final;
1442 long final;
1444
1443
1445 if (revcount > capacity) {
1444 if (revcount > capacity) {
1446 PyErr_Format(PyExc_OverflowError,
1445 PyErr_Format(PyExc_OverflowError,
1447 "bitset size (%ld) > capacity (%ld)",
1446 "bitset size (%ld) > capacity (%ld)",
1448 (long)revcount, (long)capacity);
1447 (long)revcount, (long)capacity);
1449 return NULL;
1448 return NULL;
1450 }
1449 }
1451
1450
1452 for (i = 0; i < revcount; i++) {
1451 for (i = 0; i < revcount; i++) {
1453 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1452 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1454 if (n > maxrev)
1453 if (n > maxrev)
1455 maxrev = n;
1454 maxrev = n;
1456 }
1455 }
1457
1456
1458 depth = calloc(sizeof(*depth), maxrev + 1);
1457 depth = calloc(sizeof(*depth), maxrev + 1);
1459 if (depth == NULL)
1458 if (depth == NULL)
1460 return PyErr_NoMemory();
1459 return PyErr_NoMemory();
1461
1460
1462 seen = calloc(sizeof(*seen), maxrev + 1);
1461 seen = calloc(sizeof(*seen), maxrev + 1);
1463 if (seen == NULL) {
1462 if (seen == NULL) {
1464 PyErr_NoMemory();
1463 PyErr_NoMemory();
1465 goto bail;
1464 goto bail;
1466 }
1465 }
1467
1466
1468 interesting = calloc(sizeof(*interesting), 1 << revcount);
1467 interesting = calloc(sizeof(*interesting), 1 << revcount);
1469 if (interesting == NULL) {
1468 if (interesting == NULL) {
1470 PyErr_NoMemory();
1469 PyErr_NoMemory();
1471 goto bail;
1470 goto bail;
1472 }
1471 }
1473
1472
1474 if (PyList_Sort(revs) == -1)
1473 if (PyList_Sort(revs) == -1)
1475 goto bail;
1474 goto bail;
1476
1475
1477 for (i = 0; i < revcount; i++) {
1476 for (i = 0; i < revcount; i++) {
1478 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1477 int n = (int)PyInt_AsLong(PyList_GET_ITEM(revs, i));
1479 long b = 1l << i;
1478 long b = 1l << i;
1480 depth[n] = 1;
1479 depth[n] = 1;
1481 seen[n] = b;
1480 seen[n] = b;
1482 interesting[b] = 1;
1481 interesting[b] = 1;
1483 }
1482 }
1484
1483
1485 /* invariant: ninteresting is the number of non-zero entries in
1484 /* invariant: ninteresting is the number of non-zero entries in
1486 * interesting. */
1485 * interesting. */
1487 ninteresting = (int)revcount;
1486 ninteresting = (int)revcount;
1488
1487
1489 for (v = maxrev; v >= 0 && ninteresting > 1; v--) {
1488 for (v = maxrev; v >= 0 && ninteresting > 1; v--) {
1490 int dv = depth[v];
1489 int dv = depth[v];
1491 int parents[2];
1490 int parents[2];
1492 long sv;
1491 long sv;
1493
1492
1494 if (dv == 0)
1493 if (dv == 0)
1495 continue;
1494 continue;
1496
1495
1497 sv = seen[v];
1496 sv = seen[v];
1498 if (index_get_parents(self, v, parents, maxrev) < 0)
1497 if (index_get_parents(self, v, parents, maxrev) < 0)
1499 goto bail;
1498 goto bail;
1500
1499
1501 for (i = 0; i < 2; i++) {
1500 for (i = 0; i < 2; i++) {
1502 int p = parents[i];
1501 int p = parents[i];
1503 long sp;
1502 long sp;
1504 int dp;
1503 int dp;
1505
1504
1506 if (p == -1)
1505 if (p == -1)
1507 continue;
1506 continue;
1508
1507
1509 dp = depth[p];
1508 dp = depth[p];
1510 sp = seen[p];
1509 sp = seen[p];
1511 if (dp <= dv) {
1510 if (dp <= dv) {
1512 depth[p] = dv + 1;
1511 depth[p] = dv + 1;
1513 if (sp != sv) {
1512 if (sp != sv) {
1514 interesting[sv] += 1;
1513 interesting[sv] += 1;
1515 seen[p] = sv;
1514 seen[p] = sv;
1516 if (sp) {
1515 if (sp) {
1517 interesting[sp] -= 1;
1516 interesting[sp] -= 1;
1518 if (interesting[sp] == 0)
1517 if (interesting[sp] == 0)
1519 ninteresting -= 1;
1518 ninteresting -= 1;
1520 }
1519 }
1521 }
1520 }
1522 }
1521 }
1523 else if (dv == dp - 1) {
1522 else if (dv == dp - 1) {
1524 long nsp = sp | sv;
1523 long nsp = sp | sv;
1525 if (nsp == sp)
1524 if (nsp == sp)
1526 continue;
1525 continue;
1527 seen[p] = nsp;
1526 seen[p] = nsp;
1528 interesting[sp] -= 1;
1527 interesting[sp] -= 1;
1529 if (interesting[sp] == 0)
1528 if (interesting[sp] == 0)
1530 ninteresting -= 1;
1529 ninteresting -= 1;
1531 if (interesting[nsp] == 0)
1530 if (interesting[nsp] == 0)
1532 ninteresting += 1;
1531 ninteresting += 1;
1533 interesting[nsp] += 1;
1532 interesting[nsp] += 1;
1534 }
1533 }
1535 }
1534 }
1536 interesting[sv] -= 1;
1535 interesting[sv] -= 1;
1537 if (interesting[sv] == 0)
1536 if (interesting[sv] == 0)
1538 ninteresting -= 1;
1537 ninteresting -= 1;
1539 }
1538 }
1540
1539
1541 final = 0;
1540 final = 0;
1542 j = ninteresting;
1541 j = ninteresting;
1543 for (i = 0; i < (int)(2 << revcount) && j > 0; i++) {
1542 for (i = 0; i < (int)(2 << revcount) && j > 0; i++) {
1544 if (interesting[i] == 0)
1543 if (interesting[i] == 0)
1545 continue;
1544 continue;
1546 final |= i;
1545 final |= i;
1547 j -= 1;
1546 j -= 1;
1548 }
1547 }
1549 if (final == 0) {
1548 if (final == 0) {
1550 keys = PyList_New(0);
1549 keys = PyList_New(0);
1551 goto bail;
1550 goto bail;
1552 }
1551 }
1553
1552
1554 dict = PyDict_New();
1553 dict = PyDict_New();
1555 if (dict == NULL)
1554 if (dict == NULL)
1556 goto bail;
1555 goto bail;
1557
1556
1558 for (i = 0; i < revcount; i++) {
1557 for (i = 0; i < revcount; i++) {
1559 PyObject *key;
1558 PyObject *key;
1560
1559
1561 if ((final & (1 << i)) == 0)
1560 if ((final & (1 << i)) == 0)
1562 continue;
1561 continue;
1563
1562
1564 key = PyList_GET_ITEM(revs, i);
1563 key = PyList_GET_ITEM(revs, i);
1565 Py_INCREF(key);
1564 Py_INCREF(key);
1566 Py_INCREF(Py_None);
1565 Py_INCREF(Py_None);
1567 if (PyDict_SetItem(dict, key, Py_None) == -1) {
1566 if (PyDict_SetItem(dict, key, Py_None) == -1) {
1568 Py_DECREF(key);
1567 Py_DECREF(key);
1569 Py_DECREF(Py_None);
1568 Py_DECREF(Py_None);
1570 goto bail;
1569 goto bail;
1571 }
1570 }
1572 }
1571 }
1573
1572
1574 keys = PyDict_Keys(dict);
1573 keys = PyDict_Keys(dict);
1575
1574
1576 bail:
1575 bail:
1577 free(depth);
1576 free(depth);
1578 free(seen);
1577 free(seen);
1579 free(interesting);
1578 free(interesting);
1580 Py_XDECREF(dict);
1579 Py_XDECREF(dict);
1581
1580
1582 return keys;
1581 return keys;
1583 }
1582 }
1584
1583
1585 /*
1584 /*
1586 * Given a (possibly overlapping) set of revs, return all the
1585 * Given a (possibly overlapping) set of revs, return all the
1587 * common ancestors heads: heads(::args[0] and ::a[1] and ...)
1586 * common ancestors heads: heads(::args[0] and ::a[1] and ...)
1588 */
1587 */
1589 static PyObject *index_commonancestorsheads(indexObject *self, PyObject *args)
1588 static PyObject *index_commonancestorsheads(indexObject *self, PyObject *args)
1590 {
1589 {
1591 PyObject *ret = NULL;
1590 PyObject *ret = NULL;
1592 Py_ssize_t argcount, i, len;
1591 Py_ssize_t argcount, i, len;
1593 bitmask repeat = 0;
1592 bitmask repeat = 0;
1594 int revcount = 0;
1593 int revcount = 0;
1595 int *revs;
1594 int *revs;
1596
1595
1597 argcount = PySequence_Length(args);
1596 argcount = PySequence_Length(args);
1598 revs = PyMem_Malloc(argcount * sizeof(*revs));
1597 revs = PyMem_Malloc(argcount * sizeof(*revs));
1599 if (argcount > 0 && revs == NULL)
1598 if (argcount > 0 && revs == NULL)
1600 return PyErr_NoMemory();
1599 return PyErr_NoMemory();
1601 len = index_length(self) - 1;
1600 len = index_length(self) - 1;
1602
1601
1603 for (i = 0; i < argcount; i++) {
1602 for (i = 0; i < argcount; i++) {
1604 static const int capacity = 24;
1603 static const int capacity = 24;
1605 PyObject *obj = PySequence_GetItem(args, i);
1604 PyObject *obj = PySequence_GetItem(args, i);
1606 bitmask x;
1605 bitmask x;
1607 long val;
1606 long val;
1608
1607
1609 if (!PyInt_Check(obj)) {
1608 if (!PyInt_Check(obj)) {
1610 PyErr_SetString(PyExc_TypeError,
1609 PyErr_SetString(PyExc_TypeError,
1611 "arguments must all be ints");
1610 "arguments must all be ints");
1612 Py_DECREF(obj);
1611 Py_DECREF(obj);
1613 goto bail;
1612 goto bail;
1614 }
1613 }
1615 val = PyInt_AsLong(obj);
1614 val = PyInt_AsLong(obj);
1616 Py_DECREF(obj);
1615 Py_DECREF(obj);
1617 if (val == -1) {
1616 if (val == -1) {
1618 ret = PyList_New(0);
1617 ret = PyList_New(0);
1619 goto done;
1618 goto done;
1620 }
1619 }
1621 if (val < 0 || val >= len) {
1620 if (val < 0 || val >= len) {
1622 PyErr_SetString(PyExc_IndexError,
1621 PyErr_SetString(PyExc_IndexError,
1623 "index out of range");
1622 "index out of range");
1624 goto bail;
1623 goto bail;
1625 }
1624 }
1626 /* this cheesy bloom filter lets us avoid some more
1625 /* this cheesy bloom filter lets us avoid some more
1627 * expensive duplicate checks in the common set-is-disjoint
1626 * expensive duplicate checks in the common set-is-disjoint
1628 * case */
1627 * case */
1629 x = 1ull << (val & 0x3f);
1628 x = 1ull << (val & 0x3f);
1630 if (repeat & x) {
1629 if (repeat & x) {
1631 int k;
1630 int k;
1632 for (k = 0; k < revcount; k++) {
1631 for (k = 0; k < revcount; k++) {
1633 if (val == revs[k])
1632 if (val == revs[k])
1634 goto duplicate;
1633 goto duplicate;
1635 }
1634 }
1636 }
1635 }
1637 else repeat |= x;
1636 else repeat |= x;
1638 if (revcount >= capacity) {
1637 if (revcount >= capacity) {
1639 PyErr_Format(PyExc_OverflowError,
1638 PyErr_Format(PyExc_OverflowError,
1640 "bitset size (%d) > capacity (%d)",
1639 "bitset size (%d) > capacity (%d)",
1641 revcount, capacity);
1640 revcount, capacity);
1642 goto bail;
1641 goto bail;
1643 }
1642 }
1644 revs[revcount++] = (int)val;
1643 revs[revcount++] = (int)val;
1645 duplicate:;
1644 duplicate:;
1646 }
1645 }
1647
1646
1648 if (revcount == 0) {
1647 if (revcount == 0) {
1649 ret = PyList_New(0);
1648 ret = PyList_New(0);
1650 goto done;
1649 goto done;
1651 }
1650 }
1652 if (revcount == 1) {
1651 if (revcount == 1) {
1653 PyObject *obj;
1652 PyObject *obj;
1654 ret = PyList_New(1);
1653 ret = PyList_New(1);
1655 if (ret == NULL)
1654 if (ret == NULL)
1656 goto bail;
1655 goto bail;
1657 obj = PyInt_FromLong(revs[0]);
1656 obj = PyInt_FromLong(revs[0]);
1658 if (obj == NULL)
1657 if (obj == NULL)
1659 goto bail;
1658 goto bail;
1660 PyList_SET_ITEM(ret, 0, obj);
1659 PyList_SET_ITEM(ret, 0, obj);
1661 goto done;
1660 goto done;
1662 }
1661 }
1663
1662
1664 ret = find_gca_candidates(self, revs, revcount);
1663 ret = find_gca_candidates(self, revs, revcount);
1665 if (ret == NULL)
1664 if (ret == NULL)
1666 goto bail;
1665 goto bail;
1667
1666
1668 done:
1667 done:
1669 PyMem_Free(revs);
1668 PyMem_Free(revs);
1670 return ret;
1669 return ret;
1671
1670
1672 bail:
1671 bail:
1673 PyMem_Free(revs);
1672 PyMem_Free(revs);
1674 Py_XDECREF(ret);
1673 Py_XDECREF(ret);
1675 return NULL;
1674 return NULL;
1676 }
1675 }
1677
1676
1678 /*
1677 /*
1679 * Given a (possibly overlapping) set of revs, return the greatest
1678 * Given a (possibly overlapping) set of revs, return the greatest
1680 * common ancestors: those with the longest path to the root.
1679 * common ancestors: those with the longest path to the root.
1681 */
1680 */
1682 static PyObject *index_ancestors(indexObject *self, PyObject *args)
1681 static PyObject *index_ancestors(indexObject *self, PyObject *args)
1683 {
1682 {
1684 PyObject *ret;
1683 PyObject *ret;
1685 PyObject *gca = index_commonancestorsheads(self, args);
1684 PyObject *gca = index_commonancestorsheads(self, args);
1686 if (gca == NULL)
1685 if (gca == NULL)
1687 return NULL;
1686 return NULL;
1688
1687
1689 if (PyList_GET_SIZE(gca) <= 1) {
1688 if (PyList_GET_SIZE(gca) <= 1) {
1690 return gca;
1689 return gca;
1691 }
1690 }
1692
1691
1693 ret = find_deepest(self, gca);
1692 ret = find_deepest(self, gca);
1694 Py_DECREF(gca);
1693 Py_DECREF(gca);
1695 return ret;
1694 return ret;
1696 }
1695 }
1697
1696
1698 /*
1697 /*
1699 * Invalidate any trie entries introduced by added revs.
1698 * Invalidate any trie entries introduced by added revs.
1700 */
1699 */
1701 static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
1700 static void nt_invalidate_added(indexObject *self, Py_ssize_t start)
1702 {
1701 {
1703 Py_ssize_t i, len = PyList_GET_SIZE(self->added);
1702 Py_ssize_t i, len = PyList_GET_SIZE(self->added);
1704
1703
1705 for (i = start; i < len; i++) {
1704 for (i = start; i < len; i++) {
1706 PyObject *tuple = PyList_GET_ITEM(self->added, i);
1705 PyObject *tuple = PyList_GET_ITEM(self->added, i);
1707 PyObject *node = PyTuple_GET_ITEM(tuple, 7);
1706 PyObject *node = PyTuple_GET_ITEM(tuple, 7);
1708
1707
1709 nt_insert(self, PyBytes_AS_STRING(node), -1);
1708 nt_insert(self, PyBytes_AS_STRING(node), -1);
1710 }
1709 }
1711
1710
1712 if (start == 0)
1711 if (start == 0)
1713 Py_CLEAR(self->added);
1712 Py_CLEAR(self->added);
1714 }
1713 }
1715
1714
1716 /*
1715 /*
1717 * Delete a numeric range of revs, which must be at the end of the
1716 * Delete a numeric range of revs, which must be at the end of the
1718 * range, but exclude the sentinel nullid entry.
1717 * range, but exclude the sentinel nullid entry.
1719 */
1718 */
1720 static int index_slice_del(indexObject *self, PyObject *item)
1719 static int index_slice_del(indexObject *self, PyObject *item)
1721 {
1720 {
1722 Py_ssize_t start, stop, step, slicelength;
1721 Py_ssize_t start, stop, step, slicelength;
1723 Py_ssize_t length = index_length(self);
1722 Py_ssize_t length = index_length(self);
1724 int ret = 0;
1723 int ret = 0;
1725
1724
1726 /* Argument changed from PySliceObject* to PyObject* in Python 3. */
1725 /* Argument changed from PySliceObject* to PyObject* in Python 3. */
1727 #ifdef IS_PY3K
1726 #ifdef IS_PY3K
1728 if (PySlice_GetIndicesEx(item, length,
1727 if (PySlice_GetIndicesEx(item, length,
1729 #else
1728 #else
1730 if (PySlice_GetIndicesEx((PySliceObject*)item, length,
1729 if (PySlice_GetIndicesEx((PySliceObject*)item, length,
1731 #endif
1730 #endif
1732 &start, &stop, &step, &slicelength) < 0)
1731 &start, &stop, &step, &slicelength) < 0)
1733 return -1;
1732 return -1;
1734
1733
1735 if (slicelength <= 0)
1734 if (slicelength <= 0)
1736 return 0;
1735 return 0;
1737
1736
1738 if ((step < 0 && start < stop) || (step > 0 && start > stop))
1737 if ((step < 0 && start < stop) || (step > 0 && start > stop))
1739 stop = start;
1738 stop = start;
1740
1739
1741 if (step < 0) {
1740 if (step < 0) {
1742 stop = start + 1;
1741 stop = start + 1;
1743 start = stop + step*(slicelength - 1) - 1;
1742 start = stop + step*(slicelength - 1) - 1;
1744 step = -step;
1743 step = -step;
1745 }
1744 }
1746
1745
1747 if (step != 1) {
1746 if (step != 1) {
1748 PyErr_SetString(PyExc_ValueError,
1747 PyErr_SetString(PyExc_ValueError,
1749 "revlog index delete requires step size of 1");
1748 "revlog index delete requires step size of 1");
1750 return -1;
1749 return -1;
1751 }
1750 }
1752
1751
1753 if (stop != length - 1) {
1752 if (stop != length - 1) {
1754 PyErr_SetString(PyExc_IndexError,
1753 PyErr_SetString(PyExc_IndexError,
1755 "revlog index deletion indices are invalid");
1754 "revlog index deletion indices are invalid");
1756 return -1;
1755 return -1;
1757 }
1756 }
1758
1757
1759 if (start < self->length - 1) {
1758 if (start < self->length - 1) {
1760 if (self->nt) {
1759 if (self->nt) {
1761 Py_ssize_t i;
1760 Py_ssize_t i;
1762
1761
1763 for (i = start + 1; i < self->length - 1; i++) {
1762 for (i = start + 1; i < self->length - 1; i++) {
1764 const char *node = index_node(self, i);
1763 const char *node = index_node(self, i);
1765
1764
1766 if (node)
1765 if (node)
1767 nt_insert(self, node, -1);
1766 nt_insert(self, node, -1);
1768 }
1767 }
1769 if (self->added)
1768 if (self->added)
1770 nt_invalidate_added(self, 0);
1769 nt_invalidate_added(self, 0);
1771 if (self->ntrev > start)
1770 if (self->ntrev > start)
1772 self->ntrev = (int)start;
1771 self->ntrev = (int)start;
1773 }
1772 }
1774 self->length = start + 1;
1773 self->length = start + 1;
1775 if (start < self->raw_length) {
1774 if (start < self->raw_length) {
1776 if (self->cache) {
1775 if (self->cache) {
1777 Py_ssize_t i;
1776 Py_ssize_t i;
1778 for (i = start; i < self->raw_length; i++)
1777 for (i = start; i < self->raw_length; i++)
1779 Py_CLEAR(self->cache[i]);
1778 Py_CLEAR(self->cache[i]);
1780 }
1779 }
1781 self->raw_length = start;
1780 self->raw_length = start;
1782 }
1781 }
1783 goto done;
1782 goto done;
1784 }
1783 }
1785
1784
1786 if (self->nt) {
1785 if (self->nt) {
1787 nt_invalidate_added(self, start - self->length + 1);
1786 nt_invalidate_added(self, start - self->length + 1);
1788 if (self->ntrev > start)
1787 if (self->ntrev > start)
1789 self->ntrev = (int)start;
1788 self->ntrev = (int)start;
1790 }
1789 }
1791 if (self->added)
1790 if (self->added)
1792 ret = PyList_SetSlice(self->added, start - self->length + 1,
1791 ret = PyList_SetSlice(self->added, start - self->length + 1,
1793 PyList_GET_SIZE(self->added), NULL);
1792 PyList_GET_SIZE(self->added), NULL);
1794 done:
1793 done:
1795 Py_CLEAR(self->headrevs);
1794 Py_CLEAR(self->headrevs);
1796 return ret;
1795 return ret;
1797 }
1796 }
1798
1797
1799 /*
1798 /*
1800 * Supported ops:
1799 * Supported ops:
1801 *
1800 *
1802 * slice deletion
1801 * slice deletion
1803 * string assignment (extend node->rev mapping)
1802 * string assignment (extend node->rev mapping)
1804 * string deletion (shrink node->rev mapping)
1803 * string deletion (shrink node->rev mapping)
1805 */
1804 */
1806 static int index_assign_subscript(indexObject *self, PyObject *item,
1805 static int index_assign_subscript(indexObject *self, PyObject *item,
1807 PyObject *value)
1806 PyObject *value)
1808 {
1807 {
1809 char *node;
1808 char *node;
1810 Py_ssize_t nodelen;
1809 Py_ssize_t nodelen;
1811 long rev;
1810 long rev;
1812
1811
1813 if (PySlice_Check(item) && value == NULL)
1812 if (PySlice_Check(item) && value == NULL)
1814 return index_slice_del(self, item);
1813 return index_slice_del(self, item);
1815
1814
1816 if (node_check(item, &node, &nodelen) == -1)
1815 if (node_check(item, &node, &nodelen) == -1)
1817 return -1;
1816 return -1;
1818
1817
1819 if (value == NULL)
1818 if (value == NULL)
1820 return self->nt ? nt_insert(self, node, -1) : 0;
1819 return self->nt ? nt_insert(self, node, -1) : 0;
1821 rev = PyInt_AsLong(value);
1820 rev = PyInt_AsLong(value);
1822 if (rev > INT_MAX || rev < 0) {
1821 if (rev > INT_MAX || rev < 0) {
1823 if (!PyErr_Occurred())
1822 if (!PyErr_Occurred())
1824 PyErr_SetString(PyExc_ValueError, "rev out of range");
1823 PyErr_SetString(PyExc_ValueError, "rev out of range");
1825 return -1;
1824 return -1;
1826 }
1825 }
1827
1826
1828 if (nt_init(self) == -1)
1827 if (nt_init(self) == -1)
1829 return -1;
1828 return -1;
1830 return nt_insert(self, node, (int)rev);
1829 return nt_insert(self, node, (int)rev);
1831 }
1830 }
1832
1831
1833 /*
1832 /*
1834 * Find all RevlogNG entries in an index that has inline data. Update
1833 * Find all RevlogNG entries in an index that has inline data. Update
1835 * the optional "offsets" table with those entries.
1834 * the optional "offsets" table with those entries.
1836 */
1835 */
1837 static Py_ssize_t inline_scan(indexObject *self, const char **offsets)
1836 static Py_ssize_t inline_scan(indexObject *self, const char **offsets)
1838 {
1837 {
1839 const char *data = (const char *)self->buf.buf;
1838 const char *data = (const char *)self->buf.buf;
1840 Py_ssize_t pos = 0;
1839 Py_ssize_t pos = 0;
1841 Py_ssize_t end = self->buf.len;
1840 Py_ssize_t end = self->buf.len;
1842 long incr = v1_hdrsize;
1841 long incr = v1_hdrsize;
1843 Py_ssize_t len = 0;
1842 Py_ssize_t len = 0;
1844
1843
1845 while (pos + v1_hdrsize <= end && pos >= 0) {
1844 while (pos + v1_hdrsize <= end && pos >= 0) {
1846 uint32_t comp_len;
1845 uint32_t comp_len;
1847 /* 3rd element of header is length of compressed inline data */
1846 /* 3rd element of header is length of compressed inline data */
1848 comp_len = getbe32(data + pos + 8);
1847 comp_len = getbe32(data + pos + 8);
1849 incr = v1_hdrsize + comp_len;
1848 incr = v1_hdrsize + comp_len;
1850 if (offsets)
1849 if (offsets)
1851 offsets[len] = data + pos;
1850 offsets[len] = data + pos;
1852 len++;
1851 len++;
1853 pos += incr;
1852 pos += incr;
1854 }
1853 }
1855
1854
1856 if (pos != end) {
1855 if (pos != end) {
1857 if (!PyErr_Occurred())
1856 if (!PyErr_Occurred())
1858 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1857 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1859 return -1;
1858 return -1;
1860 }
1859 }
1861
1860
1862 return len;
1861 return len;
1863 }
1862 }
1864
1863
1865 static int index_init(indexObject *self, PyObject *args)
1864 static int index_init(indexObject *self, PyObject *args)
1866 {
1865 {
1867 PyObject *data_obj, *inlined_obj;
1866 PyObject *data_obj, *inlined_obj;
1868 Py_ssize_t size;
1867 Py_ssize_t size;
1869
1868
1870 /* Initialize before argument-checking to avoid index_dealloc() crash. */
1869 /* Initialize before argument-checking to avoid index_dealloc() crash. */
1871 self->raw_length = 0;
1870 self->raw_length = 0;
1872 self->added = NULL;
1871 self->added = NULL;
1873 self->cache = NULL;
1872 self->cache = NULL;
1874 self->data = NULL;
1873 self->data = NULL;
1875 memset(&self->buf, 0, sizeof(self->buf));
1874 memset(&self->buf, 0, sizeof(self->buf));
1876 self->headrevs = NULL;
1875 self->headrevs = NULL;
1877 self->filteredrevs = Py_None;
1876 self->filteredrevs = Py_None;
1878 Py_INCREF(Py_None);
1877 Py_INCREF(Py_None);
1879 self->nt = NULL;
1878 self->nt = NULL;
1880 self->offsets = NULL;
1879 self->offsets = NULL;
1881
1880
1882 if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
1881 if (!PyArg_ParseTuple(args, "OO", &data_obj, &inlined_obj))
1883 return -1;
1882 return -1;
1884 if (!PyObject_CheckBuffer(data_obj)) {
1883 if (!PyObject_CheckBuffer(data_obj)) {
1885 PyErr_SetString(PyExc_TypeError,
1884 PyErr_SetString(PyExc_TypeError,
1886 "data does not support buffer interface");
1885 "data does not support buffer interface");
1887 return -1;
1886 return -1;
1888 }
1887 }
1889
1888
1890 if (PyObject_GetBuffer(data_obj, &self->buf, PyBUF_SIMPLE) == -1)
1889 if (PyObject_GetBuffer(data_obj, &self->buf, PyBUF_SIMPLE) == -1)
1891 return -1;
1890 return -1;
1892 size = self->buf.len;
1891 size = self->buf.len;
1893
1892
1894 self->inlined = inlined_obj && PyObject_IsTrue(inlined_obj);
1893 self->inlined = inlined_obj && PyObject_IsTrue(inlined_obj);
1895 self->data = data_obj;
1894 self->data = data_obj;
1896
1895
1897 self->ntlength = self->ntcapacity = 0;
1896 self->ntlength = self->ntcapacity = 0;
1898 self->ntdepth = self->ntsplits = 0;
1897 self->ntdepth = self->ntsplits = 0;
1899 self->ntlookups = self->ntmisses = 0;
1898 self->ntlookups = self->ntmisses = 0;
1900 self->ntrev = -1;
1899 self->ntrev = -1;
1901 Py_INCREF(self->data);
1900 Py_INCREF(self->data);
1902
1901
1903 if (self->inlined) {
1902 if (self->inlined) {
1904 Py_ssize_t len = inline_scan(self, NULL);
1903 Py_ssize_t len = inline_scan(self, NULL);
1905 if (len == -1)
1904 if (len == -1)
1906 goto bail;
1905 goto bail;
1907 self->raw_length = len;
1906 self->raw_length = len;
1908 self->length = len + 1;
1907 self->length = len + 1;
1909 } else {
1908 } else {
1910 if (size % v1_hdrsize) {
1909 if (size % v1_hdrsize) {
1911 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1910 PyErr_SetString(PyExc_ValueError, "corrupt index file");
1912 goto bail;
1911 goto bail;
1913 }
1912 }
1914 self->raw_length = size / v1_hdrsize;
1913 self->raw_length = size / v1_hdrsize;
1915 self->length = self->raw_length + 1;
1914 self->length = self->raw_length + 1;
1916 }
1915 }
1917
1916
1918 return 0;
1917 return 0;
1919 bail:
1918 bail:
1920 return -1;
1919 return -1;
1921 }
1920 }
1922
1921
1923 static PyObject *index_nodemap(indexObject *self)
1922 static PyObject *index_nodemap(indexObject *self)
1924 {
1923 {
1925 Py_INCREF(self);
1924 Py_INCREF(self);
1926 return (PyObject *)self;
1925 return (PyObject *)self;
1927 }
1926 }
1928
1927
1929 static void index_dealloc(indexObject *self)
1928 static void index_dealloc(indexObject *self)
1930 {
1929 {
1931 _index_clearcaches(self);
1930 _index_clearcaches(self);
1932 Py_XDECREF(self->filteredrevs);
1931 Py_XDECREF(self->filteredrevs);
1933 if (self->buf.buf) {
1932 if (self->buf.buf) {
1934 PyBuffer_Release(&self->buf);
1933 PyBuffer_Release(&self->buf);
1935 memset(&self->buf, 0, sizeof(self->buf));
1934 memset(&self->buf, 0, sizeof(self->buf));
1936 }
1935 }
1937 Py_XDECREF(self->data);
1936 Py_XDECREF(self->data);
1938 Py_XDECREF(self->added);
1937 Py_XDECREF(self->added);
1939 PyObject_Del(self);
1938 PyObject_Del(self);
1940 }
1939 }
1941
1940
1942 static PySequenceMethods index_sequence_methods = {
1941 static PySequenceMethods index_sequence_methods = {
1943 (lenfunc)index_length, /* sq_length */
1942 (lenfunc)index_length, /* sq_length */
1944 0, /* sq_concat */
1943 0, /* sq_concat */
1945 0, /* sq_repeat */
1944 0, /* sq_repeat */
1946 (ssizeargfunc)index_get, /* sq_item */
1945 (ssizeargfunc)index_get, /* sq_item */
1947 0, /* sq_slice */
1946 0, /* sq_slice */
1948 0, /* sq_ass_item */
1947 0, /* sq_ass_item */
1949 0, /* sq_ass_slice */
1948 0, /* sq_ass_slice */
1950 (objobjproc)index_contains, /* sq_contains */
1949 (objobjproc)index_contains, /* sq_contains */
1951 };
1950 };
1952
1951
1953 static PyMappingMethods index_mapping_methods = {
1952 static PyMappingMethods index_mapping_methods = {
1954 (lenfunc)index_length, /* mp_length */
1953 (lenfunc)index_length, /* mp_length */
1955 (binaryfunc)index_getitem, /* mp_subscript */
1954 (binaryfunc)index_getitem, /* mp_subscript */
1956 (objobjargproc)index_assign_subscript, /* mp_ass_subscript */
1955 (objobjargproc)index_assign_subscript, /* mp_ass_subscript */
1957 };
1956 };
1958
1957
1959 static PyMethodDef index_methods[] = {
1958 static PyMethodDef index_methods[] = {
1960 {"ancestors", (PyCFunction)index_ancestors, METH_VARARGS,
1959 {"ancestors", (PyCFunction)index_ancestors, METH_VARARGS,
1961 "return the gca set of the given revs"},
1960 "return the gca set of the given revs"},
1962 {"commonancestorsheads", (PyCFunction)index_commonancestorsheads,
1961 {"commonancestorsheads", (PyCFunction)index_commonancestorsheads,
1963 METH_VARARGS,
1962 METH_VARARGS,
1964 "return the heads of the common ancestors of the given revs"},
1963 "return the heads of the common ancestors of the given revs"},
1965 {"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
1964 {"clearcaches", (PyCFunction)index_clearcaches, METH_NOARGS,
1966 "clear the index caches"},
1965 "clear the index caches"},
1967 {"get", (PyCFunction)index_m_get, METH_VARARGS,
1966 {"get", (PyCFunction)index_m_get, METH_VARARGS,
1968 "get an index entry"},
1967 "get an index entry"},
1969 {"computephasesmapsets", (PyCFunction)compute_phases_map_sets,
1968 {"computephasesmapsets", (PyCFunction)compute_phases_map_sets,
1970 METH_VARARGS, "compute phases"},
1969 METH_VARARGS, "compute phases"},
1971 {"reachableroots2", (PyCFunction)reachableroots2, METH_VARARGS,
1970 {"reachableroots2", (PyCFunction)reachableroots2, METH_VARARGS,
1972 "reachableroots"},
1971 "reachableroots"},
1973 {"headrevs", (PyCFunction)index_headrevs, METH_VARARGS,
1972 {"headrevs", (PyCFunction)index_headrevs, METH_VARARGS,
1974 "get head revisions"}, /* Can do filtering since 3.2 */
1973 "get head revisions"}, /* Can do filtering since 3.2 */
1975 {"headrevsfiltered", (PyCFunction)index_headrevs, METH_VARARGS,
1974 {"headrevsfiltered", (PyCFunction)index_headrevs, METH_VARARGS,
1976 "get filtered head revisions"}, /* Can always do filtering */
1975 "get filtered head revisions"}, /* Can always do filtering */
1977 {"deltachain", (PyCFunction)index_deltachain, METH_VARARGS,
1976 {"deltachain", (PyCFunction)index_deltachain, METH_VARARGS,
1978 "determine revisions with deltas to reconstruct fulltext"},
1977 "determine revisions with deltas to reconstruct fulltext"},
1979 {"insert", (PyCFunction)index_insert, METH_VARARGS,
1978 {"insert", (PyCFunction)index_insert, METH_VARARGS,
1980 "insert an index entry"},
1979 "insert an index entry"},
1981 {"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
1980 {"partialmatch", (PyCFunction)index_partialmatch, METH_VARARGS,
1982 "match a potentially ambiguous node ID"},
1981 "match a potentially ambiguous node ID"},
1983 {"stats", (PyCFunction)index_stats, METH_NOARGS,
1982 {"stats", (PyCFunction)index_stats, METH_NOARGS,
1984 "stats for the index"},
1983 "stats for the index"},
1985 {NULL} /* Sentinel */
1984 {NULL} /* Sentinel */
1986 };
1985 };
1987
1986
1988 static PyGetSetDef index_getset[] = {
1987 static PyGetSetDef index_getset[] = {
1989 {"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
1988 {"nodemap", (getter)index_nodemap, NULL, "nodemap", NULL},
1990 {NULL} /* Sentinel */
1989 {NULL} /* Sentinel */
1991 };
1990 };
1992
1991
1993 static PyTypeObject indexType = {
1992 static PyTypeObject indexType = {
1994 PyVarObject_HEAD_INIT(NULL, 0)
1993 PyVarObject_HEAD_INIT(NULL, 0)
1995 "parsers.index", /* tp_name */
1994 "parsers.index", /* tp_name */
1996 sizeof(indexObject), /* tp_basicsize */
1995 sizeof(indexObject), /* tp_basicsize */
1997 0, /* tp_itemsize */
1996 0, /* tp_itemsize */
1998 (destructor)index_dealloc, /* tp_dealloc */
1997 (destructor)index_dealloc, /* tp_dealloc */
1999 0, /* tp_print */
1998 0, /* tp_print */
2000 0, /* tp_getattr */
1999 0, /* tp_getattr */
2001 0, /* tp_setattr */
2000 0, /* tp_setattr */
2002 0, /* tp_compare */
2001 0, /* tp_compare */
2003 0, /* tp_repr */
2002 0, /* tp_repr */
2004 0, /* tp_as_number */
2003 0, /* tp_as_number */
2005 &index_sequence_methods, /* tp_as_sequence */
2004 &index_sequence_methods, /* tp_as_sequence */
2006 &index_mapping_methods, /* tp_as_mapping */
2005 &index_mapping_methods, /* tp_as_mapping */
2007 0, /* tp_hash */
2006 0, /* tp_hash */
2008 0, /* tp_call */
2007 0, /* tp_call */
2009 0, /* tp_str */
2008 0, /* tp_str */
2010 0, /* tp_getattro */
2009 0, /* tp_getattro */
2011 0, /* tp_setattro */
2010 0, /* tp_setattro */
2012 0, /* tp_as_buffer */
2011 0, /* tp_as_buffer */
2013 Py_TPFLAGS_DEFAULT, /* tp_flags */
2012 Py_TPFLAGS_DEFAULT, /* tp_flags */
2014 "revlog index", /* tp_doc */
2013 "revlog index", /* tp_doc */
2015 0, /* tp_traverse */
2014 0, /* tp_traverse */
2016 0, /* tp_clear */
2015 0, /* tp_clear */
2017 0, /* tp_richcompare */
2016 0, /* tp_richcompare */
2018 0, /* tp_weaklistoffset */
2017 0, /* tp_weaklistoffset */
2019 0, /* tp_iter */
2018 0, /* tp_iter */
2020 0, /* tp_iternext */
2019 0, /* tp_iternext */
2021 index_methods, /* tp_methods */
2020 index_methods, /* tp_methods */
2022 0, /* tp_members */
2021 0, /* tp_members */
2023 index_getset, /* tp_getset */
2022 index_getset, /* tp_getset */
2024 0, /* tp_base */
2023 0, /* tp_base */
2025 0, /* tp_dict */
2024 0, /* tp_dict */
2026 0, /* tp_descr_get */
2025 0, /* tp_descr_get */
2027 0, /* tp_descr_set */
2026 0, /* tp_descr_set */
2028 0, /* tp_dictoffset */
2027 0, /* tp_dictoffset */
2029 (initproc)index_init, /* tp_init */
2028 (initproc)index_init, /* tp_init */
2030 0, /* tp_alloc */
2029 0, /* tp_alloc */
2031 };
2030 };
2032
2031
2033 /*
2032 /*
2034 * returns a tuple of the form (index, index, cache) with elements as
2033 * returns a tuple of the form (index, index, cache) with elements as
2035 * follows:
2034 * follows:
2036 *
2035 *
2037 * index: an index object that lazily parses RevlogNG records
2036 * index: an index object that lazily parses RevlogNG records
2038 * cache: if data is inlined, a tuple (0, index_file_content), else None
2037 * cache: if data is inlined, a tuple (0, index_file_content), else None
2039 * index_file_content could be a string, or a buffer
2038 * index_file_content could be a string, or a buffer
2040 *
2039 *
2041 * added complications are for backwards compatibility
2040 * added complications are for backwards compatibility
2042 */
2041 */
2043 PyObject *parse_index2(PyObject *self, PyObject *args)
2042 PyObject *parse_index2(PyObject *self, PyObject *args)
2044 {
2043 {
2045 PyObject *tuple = NULL, *cache = NULL;
2044 PyObject *tuple = NULL, *cache = NULL;
2046 indexObject *idx;
2045 indexObject *idx;
2047 int ret;
2046 int ret;
2048
2047
2049 idx = PyObject_New(indexObject, &indexType);
2048 idx = PyObject_New(indexObject, &indexType);
2050 if (idx == NULL)
2049 if (idx == NULL)
2051 goto bail;
2050 goto bail;
2052
2051
2053 ret = index_init(idx, args);
2052 ret = index_init(idx, args);
2054 if (ret == -1)
2053 if (ret == -1)
2055 goto bail;
2054 goto bail;
2056
2055
2057 if (idx->inlined) {
2056 if (idx->inlined) {
2058 cache = Py_BuildValue("iO", 0, idx->data);
2057 cache = Py_BuildValue("iO", 0, idx->data);
2059 if (cache == NULL)
2058 if (cache == NULL)
2060 goto bail;
2059 goto bail;
2061 } else {
2060 } else {
2062 cache = Py_None;
2061 cache = Py_None;
2063 Py_INCREF(cache);
2062 Py_INCREF(cache);
2064 }
2063 }
2065
2064
2066 tuple = Py_BuildValue("NN", idx, cache);
2065 tuple = Py_BuildValue("NN", idx, cache);
2067 if (!tuple)
2066 if (!tuple)
2068 goto bail;
2067 goto bail;
2069 return tuple;
2068 return tuple;
2070
2069
2071 bail:
2070 bail:
2072 Py_XDECREF(idx);
2071 Py_XDECREF(idx);
2073 Py_XDECREF(cache);
2072 Py_XDECREF(cache);
2074 Py_XDECREF(tuple);
2073 Py_XDECREF(tuple);
2075 return NULL;
2074 return NULL;
2076 }
2075 }
2077
2076
2078 void revlog_module_init(PyObject *mod)
2077 void revlog_module_init(PyObject *mod)
2079 {
2078 {
2080 indexType.tp_new = PyType_GenericNew;
2079 indexType.tp_new = PyType_GenericNew;
2081 if (PyType_Ready(&indexType) < 0)
2080 if (PyType_Ready(&indexType) < 0)
2082 return;
2081 return;
2083 Py_INCREF(&indexType);
2082 Py_INCREF(&indexType);
2084 PyModule_AddObject(mod, "index", (PyObject *)&indexType);
2083 PyModule_AddObject(mod, "index", (PyObject *)&indexType);
2085
2084
2086 nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
2085 nullentry = Py_BuildValue("iiiiiiis#", 0, 0, 0,
2087 -1, -1, -1, -1, nullid, 20);
2086 -1, -1, -1, -1, nullid, 20);
2088 if (nullentry)
2087 if (nullentry)
2089 PyObject_GC_UnTrack(nullentry);
2088 PyObject_GC_UnTrack(nullentry);
2090 }
2089 }
General Comments 0
You need to be logged in to leave comments. Login now