##// END OF EJS Templates
dirstate-entry: add a `added` property...
marmoute -
r48315:8bcae9bf default
parent child Browse files
Show More
@@ -1,860 +1,870 b''
1 /*
1 /*
2 parsers.c - efficient content parsing
2 parsers.c - efficient content parsing
3
3
4 Copyright 2008 Olivia Mackall <olivia@selenic.com> and others
4 Copyright 2008 Olivia Mackall <olivia@selenic.com> and others
5
5
6 This software may be used and distributed according to the terms of
6 This software may be used and distributed according to the terms of
7 the GNU General Public License, incorporated herein by reference.
7 the GNU General Public License, incorporated herein by reference.
8 */
8 */
9
9
10 #define PY_SSIZE_T_CLEAN
10 #define PY_SSIZE_T_CLEAN
11 #include <Python.h>
11 #include <Python.h>
12 #include <ctype.h>
12 #include <ctype.h>
13 #include <stddef.h>
13 #include <stddef.h>
14 #include <string.h>
14 #include <string.h>
15
15
16 #include "bitmanipulation.h"
16 #include "bitmanipulation.h"
17 #include "charencode.h"
17 #include "charencode.h"
18 #include "util.h"
18 #include "util.h"
19
19
#ifdef IS_PY3K
/* Temporary aliases that let code written against the PyInt_* API compile
 * on Python 3, where only the PyLong_* API exists. They should be removed
 * once Python 3 is fully supported and the extensions use the proper types
 * themselves. */
#define PyInt_Check PyLong_Check
#define PyInt_FromLong PyLong_FromLong
#define PyInt_FromSsize_t PyLong_FromSsize_t
#define PyInt_AsLong PyLong_AsLong
#endif
29
29
/* Message text for a Python minor version mismatch. */
static const char *const versionerrortext = "Python minor version mismatch";
31
31
/* Sentinel values compared against an entry's `size` field by the
 * from_p2 / from_p2_removed getters (-2) and the merged_removed getter (-1). */
static const int dirstate_v1_from_p2 = -2;
static const int dirstate_v1_nonnormal = -1;
34
34
35 static PyObject *dict_new_presized(PyObject *self, PyObject *args)
35 static PyObject *dict_new_presized(PyObject *self, PyObject *args)
36 {
36 {
37 Py_ssize_t expected_size;
37 Py_ssize_t expected_size;
38
38
39 if (!PyArg_ParseTuple(args, "n:make_presized_dict", &expected_size)) {
39 if (!PyArg_ParseTuple(args, "n:make_presized_dict", &expected_size)) {
40 return NULL;
40 return NULL;
41 }
41 }
42
42
43 return _dict_new_presized(expected_size);
43 return _dict_new_presized(expected_size);
44 }
44 }
45
45
46 static inline dirstateTupleObject *make_dirstate_tuple(char state, int mode,
46 static inline dirstateTupleObject *make_dirstate_tuple(char state, int mode,
47 int size, int mtime)
47 int size, int mtime)
48 {
48 {
49 dirstateTupleObject *t =
49 dirstateTupleObject *t =
50 PyObject_New(dirstateTupleObject, &dirstateTupleType);
50 PyObject_New(dirstateTupleObject, &dirstateTupleType);
51 if (!t) {
51 if (!t) {
52 return NULL;
52 return NULL;
53 }
53 }
54 t->state = state;
54 t->state = state;
55 t->mode = mode;
55 t->mode = mode;
56 t->size = size;
56 t->size = size;
57 t->mtime = mtime;
57 t->mtime = mtime;
58 return t;
58 return t;
59 }
59 }
60
60
61 static PyObject *dirstate_tuple_new(PyTypeObject *subtype, PyObject *args,
61 static PyObject *dirstate_tuple_new(PyTypeObject *subtype, PyObject *args,
62 PyObject *kwds)
62 PyObject *kwds)
63 {
63 {
64 /* We do all the initialization here and not a tp_init function because
64 /* We do all the initialization here and not a tp_init function because
65 * dirstate_tuple is immutable. */
65 * dirstate_tuple is immutable. */
66 dirstateTupleObject *t;
66 dirstateTupleObject *t;
67 char state;
67 char state;
68 int size, mode, mtime;
68 int size, mode, mtime;
69 if (!PyArg_ParseTuple(args, "ciii", &state, &mode, &size, &mtime)) {
69 if (!PyArg_ParseTuple(args, "ciii", &state, &mode, &size, &mtime)) {
70 return NULL;
70 return NULL;
71 }
71 }
72
72
73 t = (dirstateTupleObject *)subtype->tp_alloc(subtype, 1);
73 t = (dirstateTupleObject *)subtype->tp_alloc(subtype, 1);
74 if (!t) {
74 if (!t) {
75 return NULL;
75 return NULL;
76 }
76 }
77 t->state = state;
77 t->state = state;
78 t->mode = mode;
78 t->mode = mode;
79 t->size = size;
79 t->size = size;
80 t->mtime = mtime;
80 t->mtime = mtime;
81
81
82 return (PyObject *)t;
82 return (PyObject *)t;
83 }
83 }
84
84
85 static void dirstate_tuple_dealloc(PyObject *o)
85 static void dirstate_tuple_dealloc(PyObject *o)
86 {
86 {
87 PyObject_Del(o);
87 PyObject_Del(o);
88 }
88 }
89
89
90 static Py_ssize_t dirstate_tuple_length(PyObject *o)
90 static Py_ssize_t dirstate_tuple_length(PyObject *o)
91 {
91 {
92 return 4;
92 return 4;
93 }
93 }
94
94
95 static PyObject *dirstate_tuple_item(PyObject *o, Py_ssize_t i)
95 static PyObject *dirstate_tuple_item(PyObject *o, Py_ssize_t i)
96 {
96 {
97 dirstateTupleObject *t = (dirstateTupleObject *)o;
97 dirstateTupleObject *t = (dirstateTupleObject *)o;
98 switch (i) {
98 switch (i) {
99 case 0:
99 case 0:
100 return PyBytes_FromStringAndSize(&t->state, 1);
100 return PyBytes_FromStringAndSize(&t->state, 1);
101 case 1:
101 case 1:
102 return PyInt_FromLong(t->mode);
102 return PyInt_FromLong(t->mode);
103 case 2:
103 case 2:
104 return PyInt_FromLong(t->size);
104 return PyInt_FromLong(t->size);
105 case 3:
105 case 3:
106 return PyInt_FromLong(t->mtime);
106 return PyInt_FromLong(t->mtime);
107 default:
107 default:
108 PyErr_SetString(PyExc_IndexError, "index out of range");
108 PyErr_SetString(PyExc_IndexError, "index out of range");
109 return NULL;
109 return NULL;
110 }
110 }
111 }
111 }
112
112
113 static PySequenceMethods dirstate_tuple_sq = {
113 static PySequenceMethods dirstate_tuple_sq = {
114 dirstate_tuple_length, /* sq_length */
114 dirstate_tuple_length, /* sq_length */
115 0, /* sq_concat */
115 0, /* sq_concat */
116 0, /* sq_repeat */
116 0, /* sq_repeat */
117 dirstate_tuple_item, /* sq_item */
117 dirstate_tuple_item, /* sq_item */
118 0, /* sq_ass_item */
118 0, /* sq_ass_item */
119 0, /* sq_contains */
119 0, /* sq_contains */
120 0, /* sq_inplace_concat */
120 0, /* sq_inplace_concat */
121 0 /* sq_inplace_repeat */
121 0 /* sq_inplace_repeat */
122 };
122 };
123
123
124 static PyObject *dirstatetuple_v1_state(dirstateTupleObject *self)
124 static PyObject *dirstatetuple_v1_state(dirstateTupleObject *self)
125 {
125 {
126 return PyBytes_FromStringAndSize(&self->state, 1);
126 return PyBytes_FromStringAndSize(&self->state, 1);
127 };
127 };
128
128
129 static PyObject *dirstatetuple_v1_mode(dirstateTupleObject *self)
129 static PyObject *dirstatetuple_v1_mode(dirstateTupleObject *self)
130 {
130 {
131 return PyInt_FromLong(self->mode);
131 return PyInt_FromLong(self->mode);
132 };
132 };
133
133
134 static PyObject *dirstatetuple_v1_size(dirstateTupleObject *self)
134 static PyObject *dirstatetuple_v1_size(dirstateTupleObject *self)
135 {
135 {
136 return PyInt_FromLong(self->size);
136 return PyInt_FromLong(self->size);
137 };
137 };
138
138
139 static PyObject *dirstatetuple_v1_mtime(dirstateTupleObject *self)
139 static PyObject *dirstatetuple_v1_mtime(dirstateTupleObject *self)
140 {
140 {
141 return PyInt_FromLong(self->mtime);
141 return PyInt_FromLong(self->mtime);
142 };
142 };
143
143
144 static PyMethodDef dirstatetuple_methods[] = {
144 static PyMethodDef dirstatetuple_methods[] = {
145 {"v1_state", (PyCFunction)dirstatetuple_v1_state, METH_NOARGS,
145 {"v1_state", (PyCFunction)dirstatetuple_v1_state, METH_NOARGS,
146 "return a \"state\" suitable for v1 serialization"},
146 "return a \"state\" suitable for v1 serialization"},
147 {"v1_mode", (PyCFunction)dirstatetuple_v1_mode, METH_NOARGS,
147 {"v1_mode", (PyCFunction)dirstatetuple_v1_mode, METH_NOARGS,
148 "return a \"mode\" suitable for v1 serialization"},
148 "return a \"mode\" suitable for v1 serialization"},
149 {"v1_size", (PyCFunction)dirstatetuple_v1_size, METH_NOARGS,
149 {"v1_size", (PyCFunction)dirstatetuple_v1_size, METH_NOARGS,
150 "return a \"size\" suitable for v1 serialization"},
150 "return a \"size\" suitable for v1 serialization"},
151 {"v1_mtime", (PyCFunction)dirstatetuple_v1_mtime, METH_NOARGS,
151 {"v1_mtime", (PyCFunction)dirstatetuple_v1_mtime, METH_NOARGS,
152 "return a \"mtime\" suitable for v1 serialization"},
152 "return a \"mtime\" suitable for v1 serialization"},
153 {NULL} /* Sentinel */
153 {NULL} /* Sentinel */
154 };
154 };
155
155
156 static PyObject *dirstatetuple_get_state(dirstateTupleObject *self)
156 static PyObject *dirstatetuple_get_state(dirstateTupleObject *self)
157 {
157 {
158 return PyBytes_FromStringAndSize(&self->state, 1);
158 return PyBytes_FromStringAndSize(&self->state, 1);
159 };
159 };
160
160
161 static PyObject *dirstatetuple_get_added(dirstateTupleObject *self)
162 {
163 if (self->state == 'a') {
164 Py_RETURN_TRUE;
165 } else {
166 Py_RETURN_FALSE;
167 }
168 };
169
161 static PyObject *dirstatetuple_get_merged(dirstateTupleObject *self)
170 static PyObject *dirstatetuple_get_merged(dirstateTupleObject *self)
162 {
171 {
163 if (self->state == 'm') {
172 if (self->state == 'm') {
164 Py_RETURN_TRUE;
173 Py_RETURN_TRUE;
165 } else {
174 } else {
166 Py_RETURN_FALSE;
175 Py_RETURN_FALSE;
167 }
176 }
168 };
177 };
169
178
170 static PyObject *dirstatetuple_get_merged_removed(dirstateTupleObject *self)
179 static PyObject *dirstatetuple_get_merged_removed(dirstateTupleObject *self)
171 {
180 {
172 if (self->state == 'r' && self->size == dirstate_v1_nonnormal) {
181 if (self->state == 'r' && self->size == dirstate_v1_nonnormal) {
173 Py_RETURN_TRUE;
182 Py_RETURN_TRUE;
174 } else {
183 } else {
175 Py_RETURN_FALSE;
184 Py_RETURN_FALSE;
176 }
185 }
177 };
186 };
178
187
179 static PyObject *dirstatetuple_get_from_p2(dirstateTupleObject *self)
188 static PyObject *dirstatetuple_get_from_p2(dirstateTupleObject *self)
180 {
189 {
181 if (self->state == 'n' && self->size == dirstate_v1_from_p2) {
190 if (self->state == 'n' && self->size == dirstate_v1_from_p2) {
182 Py_RETURN_TRUE;
191 Py_RETURN_TRUE;
183 } else {
192 } else {
184 Py_RETURN_FALSE;
193 Py_RETURN_FALSE;
185 }
194 }
186 };
195 };
187
196
188 static PyObject *dirstatetuple_get_from_p2_removed(dirstateTupleObject *self)
197 static PyObject *dirstatetuple_get_from_p2_removed(dirstateTupleObject *self)
189 {
198 {
190 if (self->state == 'r' && self->size == dirstate_v1_from_p2) {
199 if (self->state == 'r' && self->size == dirstate_v1_from_p2) {
191 Py_RETURN_TRUE;
200 Py_RETURN_TRUE;
192 } else {
201 } else {
193 Py_RETURN_FALSE;
202 Py_RETURN_FALSE;
194 }
203 }
195 };
204 };
196
205
197 static PyObject *dirstatetuple_get_removed(dirstateTupleObject *self)
206 static PyObject *dirstatetuple_get_removed(dirstateTupleObject *self)
198 {
207 {
199 if (self->state == 'r') {
208 if (self->state == 'r') {
200 Py_RETURN_TRUE;
209 Py_RETURN_TRUE;
201 } else {
210 } else {
202 Py_RETURN_FALSE;
211 Py_RETURN_FALSE;
203 }
212 }
204 };
213 };
205
214
206 static PyGetSetDef dirstatetuple_getset[] = {
215 static PyGetSetDef dirstatetuple_getset[] = {
207 {"state", (getter)dirstatetuple_get_state, NULL, "state", NULL},
216 {"state", (getter)dirstatetuple_get_state, NULL, "state", NULL},
217 {"added", (getter)dirstatetuple_get_added, NULL, "added", NULL},
208 {"merged_removed", (getter)dirstatetuple_get_merged_removed, NULL,
218 {"merged_removed", (getter)dirstatetuple_get_merged_removed, NULL,
209 "merged_removed", NULL},
219 "merged_removed", NULL},
210 {"merged", (getter)dirstatetuple_get_merged, NULL, "merged", NULL},
220 {"merged", (getter)dirstatetuple_get_merged, NULL, "merged", NULL},
211 {"from_p2_removed", (getter)dirstatetuple_get_from_p2_removed, NULL,
221 {"from_p2_removed", (getter)dirstatetuple_get_from_p2_removed, NULL,
212 "from_p2_removed", NULL},
222 "from_p2_removed", NULL},
213 {"from_p2", (getter)dirstatetuple_get_from_p2, NULL, "from_p2", NULL},
223 {"from_p2", (getter)dirstatetuple_get_from_p2, NULL, "from_p2", NULL},
214 {"removed", (getter)dirstatetuple_get_removed, NULL, "removed", NULL},
224 {"removed", (getter)dirstatetuple_get_removed, NULL, "removed", NULL},
215 {NULL} /* Sentinel */
225 {NULL} /* Sentinel */
216 };
226 };
217
227
218 PyTypeObject dirstateTupleType = {
228 PyTypeObject dirstateTupleType = {
219 PyVarObject_HEAD_INIT(NULL, 0) /* header */
229 PyVarObject_HEAD_INIT(NULL, 0) /* header */
220 "dirstate_tuple", /* tp_name */
230 "dirstate_tuple", /* tp_name */
221 sizeof(dirstateTupleObject), /* tp_basicsize */
231 sizeof(dirstateTupleObject), /* tp_basicsize */
222 0, /* tp_itemsize */
232 0, /* tp_itemsize */
223 (destructor)dirstate_tuple_dealloc, /* tp_dealloc */
233 (destructor)dirstate_tuple_dealloc, /* tp_dealloc */
224 0, /* tp_print */
234 0, /* tp_print */
225 0, /* tp_getattr */
235 0, /* tp_getattr */
226 0, /* tp_setattr */
236 0, /* tp_setattr */
227 0, /* tp_compare */
237 0, /* tp_compare */
228 0, /* tp_repr */
238 0, /* tp_repr */
229 0, /* tp_as_number */
239 0, /* tp_as_number */
230 &dirstate_tuple_sq, /* tp_as_sequence */
240 &dirstate_tuple_sq, /* tp_as_sequence */
231 0, /* tp_as_mapping */
241 0, /* tp_as_mapping */
232 0, /* tp_hash */
242 0, /* tp_hash */
233 0, /* tp_call */
243 0, /* tp_call */
234 0, /* tp_str */
244 0, /* tp_str */
235 0, /* tp_getattro */
245 0, /* tp_getattro */
236 0, /* tp_setattro */
246 0, /* tp_setattro */
237 0, /* tp_as_buffer */
247 0, /* tp_as_buffer */
238 Py_TPFLAGS_DEFAULT, /* tp_flags */
248 Py_TPFLAGS_DEFAULT, /* tp_flags */
239 "dirstate tuple", /* tp_doc */
249 "dirstate tuple", /* tp_doc */
240 0, /* tp_traverse */
250 0, /* tp_traverse */
241 0, /* tp_clear */
251 0, /* tp_clear */
242 0, /* tp_richcompare */
252 0, /* tp_richcompare */
243 0, /* tp_weaklistoffset */
253 0, /* tp_weaklistoffset */
244 0, /* tp_iter */
254 0, /* tp_iter */
245 0, /* tp_iternext */
255 0, /* tp_iternext */
246 dirstatetuple_methods, /* tp_methods */
256 dirstatetuple_methods, /* tp_methods */
247 0, /* tp_members */
257 0, /* tp_members */
248 dirstatetuple_getset, /* tp_getset */
258 dirstatetuple_getset, /* tp_getset */
249 0, /* tp_base */
259 0, /* tp_base */
250 0, /* tp_dict */
260 0, /* tp_dict */
251 0, /* tp_descr_get */
261 0, /* tp_descr_get */
252 0, /* tp_descr_set */
262 0, /* tp_descr_set */
253 0, /* tp_dictoffset */
263 0, /* tp_dictoffset */
254 0, /* tp_init */
264 0, /* tp_init */
255 0, /* tp_alloc */
265 0, /* tp_alloc */
256 dirstate_tuple_new, /* tp_new */
266 dirstate_tuple_new, /* tp_new */
257 };
267 };
258
268
259 static PyObject *parse_dirstate(PyObject *self, PyObject *args)
269 static PyObject *parse_dirstate(PyObject *self, PyObject *args)
260 {
270 {
261 PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
271 PyObject *dmap, *cmap, *parents = NULL, *ret = NULL;
262 PyObject *fname = NULL, *cname = NULL, *entry = NULL;
272 PyObject *fname = NULL, *cname = NULL, *entry = NULL;
263 char state, *cur, *str, *cpos;
273 char state, *cur, *str, *cpos;
264 int mode, size, mtime;
274 int mode, size, mtime;
265 unsigned int flen, pos = 40;
275 unsigned int flen, pos = 40;
266 Py_ssize_t len = 40;
276 Py_ssize_t len = 40;
267 Py_ssize_t readlen;
277 Py_ssize_t readlen;
268
278
269 if (!PyArg_ParseTuple(
279 if (!PyArg_ParseTuple(
270 args, PY23("O!O!s#:parse_dirstate", "O!O!y#:parse_dirstate"),
280 args, PY23("O!O!s#:parse_dirstate", "O!O!y#:parse_dirstate"),
271 &PyDict_Type, &dmap, &PyDict_Type, &cmap, &str, &readlen)) {
281 &PyDict_Type, &dmap, &PyDict_Type, &cmap, &str, &readlen)) {
272 goto quit;
282 goto quit;
273 }
283 }
274
284
275 len = readlen;
285 len = readlen;
276
286
277 /* read parents */
287 /* read parents */
278 if (len < 40) {
288 if (len < 40) {
279 PyErr_SetString(PyExc_ValueError,
289 PyErr_SetString(PyExc_ValueError,
280 "too little data for parents");
290 "too little data for parents");
281 goto quit;
291 goto quit;
282 }
292 }
283
293
284 parents = Py_BuildValue(PY23("s#s#", "y#y#"), str, (Py_ssize_t)20,
294 parents = Py_BuildValue(PY23("s#s#", "y#y#"), str, (Py_ssize_t)20,
285 str + 20, (Py_ssize_t)20);
295 str + 20, (Py_ssize_t)20);
286 if (!parents) {
296 if (!parents) {
287 goto quit;
297 goto quit;
288 }
298 }
289
299
290 /* read filenames */
300 /* read filenames */
291 while (pos >= 40 && pos < len) {
301 while (pos >= 40 && pos < len) {
292 if (pos + 17 > len) {
302 if (pos + 17 > len) {
293 PyErr_SetString(PyExc_ValueError,
303 PyErr_SetString(PyExc_ValueError,
294 "overflow in dirstate");
304 "overflow in dirstate");
295 goto quit;
305 goto quit;
296 }
306 }
297 cur = str + pos;
307 cur = str + pos;
298 /* unpack header */
308 /* unpack header */
299 state = *cur;
309 state = *cur;
300 mode = getbe32(cur + 1);
310 mode = getbe32(cur + 1);
301 size = getbe32(cur + 5);
311 size = getbe32(cur + 5);
302 mtime = getbe32(cur + 9);
312 mtime = getbe32(cur + 9);
303 flen = getbe32(cur + 13);
313 flen = getbe32(cur + 13);
304 pos += 17;
314 pos += 17;
305 cur += 17;
315 cur += 17;
306 if (flen > len - pos) {
316 if (flen > len - pos) {
307 PyErr_SetString(PyExc_ValueError,
317 PyErr_SetString(PyExc_ValueError,
308 "overflow in dirstate");
318 "overflow in dirstate");
309 goto quit;
319 goto quit;
310 }
320 }
311
321
312 entry =
322 entry =
313 (PyObject *)make_dirstate_tuple(state, mode, size, mtime);
323 (PyObject *)make_dirstate_tuple(state, mode, size, mtime);
314 cpos = memchr(cur, 0, flen);
324 cpos = memchr(cur, 0, flen);
315 if (cpos) {
325 if (cpos) {
316 fname = PyBytes_FromStringAndSize(cur, cpos - cur);
326 fname = PyBytes_FromStringAndSize(cur, cpos - cur);
317 cname = PyBytes_FromStringAndSize(
327 cname = PyBytes_FromStringAndSize(
318 cpos + 1, flen - (cpos - cur) - 1);
328 cpos + 1, flen - (cpos - cur) - 1);
319 if (!fname || !cname ||
329 if (!fname || !cname ||
320 PyDict_SetItem(cmap, fname, cname) == -1 ||
330 PyDict_SetItem(cmap, fname, cname) == -1 ||
321 PyDict_SetItem(dmap, fname, entry) == -1) {
331 PyDict_SetItem(dmap, fname, entry) == -1) {
322 goto quit;
332 goto quit;
323 }
333 }
324 Py_DECREF(cname);
334 Py_DECREF(cname);
325 } else {
335 } else {
326 fname = PyBytes_FromStringAndSize(cur, flen);
336 fname = PyBytes_FromStringAndSize(cur, flen);
327 if (!fname ||
337 if (!fname ||
328 PyDict_SetItem(dmap, fname, entry) == -1) {
338 PyDict_SetItem(dmap, fname, entry) == -1) {
329 goto quit;
339 goto quit;
330 }
340 }
331 }
341 }
332 Py_DECREF(fname);
342 Py_DECREF(fname);
333 Py_DECREF(entry);
343 Py_DECREF(entry);
334 fname = cname = entry = NULL;
344 fname = cname = entry = NULL;
335 pos += flen;
345 pos += flen;
336 }
346 }
337
347
338 ret = parents;
348 ret = parents;
339 Py_INCREF(ret);
349 Py_INCREF(ret);
340 quit:
350 quit:
341 Py_XDECREF(fname);
351 Py_XDECREF(fname);
342 Py_XDECREF(cname);
352 Py_XDECREF(cname);
343 Py_XDECREF(entry);
353 Py_XDECREF(entry);
344 Py_XDECREF(parents);
354 Py_XDECREF(parents);
345 return ret;
355 return ret;
346 }
356 }
347
357
348 /*
358 /*
349 * Build a set of non-normal and other parent entries from the dirstate dmap
359 * Build a set of non-normal and other parent entries from the dirstate dmap
350 */
360 */
351 static PyObject *nonnormalotherparententries(PyObject *self, PyObject *args)
361 static PyObject *nonnormalotherparententries(PyObject *self, PyObject *args)
352 {
362 {
353 PyObject *dmap, *fname, *v;
363 PyObject *dmap, *fname, *v;
354 PyObject *nonnset = NULL, *otherpset = NULL, *result = NULL;
364 PyObject *nonnset = NULL, *otherpset = NULL, *result = NULL;
355 Py_ssize_t pos;
365 Py_ssize_t pos;
356
366
357 if (!PyArg_ParseTuple(args, "O!:nonnormalentries", &PyDict_Type,
367 if (!PyArg_ParseTuple(args, "O!:nonnormalentries", &PyDict_Type,
358 &dmap)) {
368 &dmap)) {
359 goto bail;
369 goto bail;
360 }
370 }
361
371
362 nonnset = PySet_New(NULL);
372 nonnset = PySet_New(NULL);
363 if (nonnset == NULL) {
373 if (nonnset == NULL) {
364 goto bail;
374 goto bail;
365 }
375 }
366
376
367 otherpset = PySet_New(NULL);
377 otherpset = PySet_New(NULL);
368 if (otherpset == NULL) {
378 if (otherpset == NULL) {
369 goto bail;
379 goto bail;
370 }
380 }
371
381
372 pos = 0;
382 pos = 0;
373 while (PyDict_Next(dmap, &pos, &fname, &v)) {
383 while (PyDict_Next(dmap, &pos, &fname, &v)) {
374 dirstateTupleObject *t;
384 dirstateTupleObject *t;
375 if (!dirstate_tuple_check(v)) {
385 if (!dirstate_tuple_check(v)) {
376 PyErr_SetString(PyExc_TypeError,
386 PyErr_SetString(PyExc_TypeError,
377 "expected a dirstate tuple");
387 "expected a dirstate tuple");
378 goto bail;
388 goto bail;
379 }
389 }
380 t = (dirstateTupleObject *)v;
390 t = (dirstateTupleObject *)v;
381
391
382 if (t->state == 'n' && t->size == -2) {
392 if (t->state == 'n' && t->size == -2) {
383 if (PySet_Add(otherpset, fname) == -1) {
393 if (PySet_Add(otherpset, fname) == -1) {
384 goto bail;
394 goto bail;
385 }
395 }
386 }
396 }
387
397
388 if (t->state == 'n' && t->mtime != -1) {
398 if (t->state == 'n' && t->mtime != -1) {
389 continue;
399 continue;
390 }
400 }
391 if (PySet_Add(nonnset, fname) == -1) {
401 if (PySet_Add(nonnset, fname) == -1) {
392 goto bail;
402 goto bail;
393 }
403 }
394 }
404 }
395
405
396 result = Py_BuildValue("(OO)", nonnset, otherpset);
406 result = Py_BuildValue("(OO)", nonnset, otherpset);
397 if (result == NULL) {
407 if (result == NULL) {
398 goto bail;
408 goto bail;
399 }
409 }
400 Py_DECREF(nonnset);
410 Py_DECREF(nonnset);
401 Py_DECREF(otherpset);
411 Py_DECREF(otherpset);
402 return result;
412 return result;
403 bail:
413 bail:
404 Py_XDECREF(nonnset);
414 Py_XDECREF(nonnset);
405 Py_XDECREF(otherpset);
415 Py_XDECREF(otherpset);
406 Py_XDECREF(result);
416 Py_XDECREF(result);
407 return NULL;
417 return NULL;
408 }
418 }
409
419
410 /*
420 /*
411 * Efficiently pack a dirstate object into its on-disk format.
421 * Efficiently pack a dirstate object into its on-disk format.
412 */
422 */
413 static PyObject *pack_dirstate(PyObject *self, PyObject *args)
423 static PyObject *pack_dirstate(PyObject *self, PyObject *args)
414 {
424 {
415 PyObject *packobj = NULL;
425 PyObject *packobj = NULL;
416 PyObject *map, *copymap, *pl, *mtime_unset = NULL;
426 PyObject *map, *copymap, *pl, *mtime_unset = NULL;
417 Py_ssize_t nbytes, pos, l;
427 Py_ssize_t nbytes, pos, l;
418 PyObject *k, *v = NULL, *pn;
428 PyObject *k, *v = NULL, *pn;
419 char *p, *s;
429 char *p, *s;
420 int now;
430 int now;
421
431
422 if (!PyArg_ParseTuple(args, "O!O!O!i:pack_dirstate", &PyDict_Type, &map,
432 if (!PyArg_ParseTuple(args, "O!O!O!i:pack_dirstate", &PyDict_Type, &map,
423 &PyDict_Type, &copymap, &PyTuple_Type, &pl,
433 &PyDict_Type, &copymap, &PyTuple_Type, &pl,
424 &now)) {
434 &now)) {
425 return NULL;
435 return NULL;
426 }
436 }
427
437
428 if (PyTuple_Size(pl) != 2) {
438 if (PyTuple_Size(pl) != 2) {
429 PyErr_SetString(PyExc_TypeError, "expected 2-element tuple");
439 PyErr_SetString(PyExc_TypeError, "expected 2-element tuple");
430 return NULL;
440 return NULL;
431 }
441 }
432
442
433 /* Figure out how much we need to allocate. */
443 /* Figure out how much we need to allocate. */
434 for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
444 for (nbytes = 40, pos = 0; PyDict_Next(map, &pos, &k, &v);) {
435 PyObject *c;
445 PyObject *c;
436 if (!PyBytes_Check(k)) {
446 if (!PyBytes_Check(k)) {
437 PyErr_SetString(PyExc_TypeError, "expected string key");
447 PyErr_SetString(PyExc_TypeError, "expected string key");
438 goto bail;
448 goto bail;
439 }
449 }
440 nbytes += PyBytes_GET_SIZE(k) + 17;
450 nbytes += PyBytes_GET_SIZE(k) + 17;
441 c = PyDict_GetItem(copymap, k);
451 c = PyDict_GetItem(copymap, k);
442 if (c) {
452 if (c) {
443 if (!PyBytes_Check(c)) {
453 if (!PyBytes_Check(c)) {
444 PyErr_SetString(PyExc_TypeError,
454 PyErr_SetString(PyExc_TypeError,
445 "expected string key");
455 "expected string key");
446 goto bail;
456 goto bail;
447 }
457 }
448 nbytes += PyBytes_GET_SIZE(c) + 1;
458 nbytes += PyBytes_GET_SIZE(c) + 1;
449 }
459 }
450 }
460 }
451
461
452 packobj = PyBytes_FromStringAndSize(NULL, nbytes);
462 packobj = PyBytes_FromStringAndSize(NULL, nbytes);
453 if (packobj == NULL) {
463 if (packobj == NULL) {
454 goto bail;
464 goto bail;
455 }
465 }
456
466
457 p = PyBytes_AS_STRING(packobj);
467 p = PyBytes_AS_STRING(packobj);
458
468
459 pn = PyTuple_GET_ITEM(pl, 0);
469 pn = PyTuple_GET_ITEM(pl, 0);
460 if (PyBytes_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
470 if (PyBytes_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
461 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
471 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
462 goto bail;
472 goto bail;
463 }
473 }
464 memcpy(p, s, l);
474 memcpy(p, s, l);
465 p += 20;
475 p += 20;
466 pn = PyTuple_GET_ITEM(pl, 1);
476 pn = PyTuple_GET_ITEM(pl, 1);
467 if (PyBytes_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
477 if (PyBytes_AsStringAndSize(pn, &s, &l) == -1 || l != 20) {
468 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
478 PyErr_SetString(PyExc_TypeError, "expected a 20-byte hash");
469 goto bail;
479 goto bail;
470 }
480 }
471 memcpy(p, s, l);
481 memcpy(p, s, l);
472 p += 20;
482 p += 20;
473
483
474 for (pos = 0; PyDict_Next(map, &pos, &k, &v);) {
484 for (pos = 0; PyDict_Next(map, &pos, &k, &v);) {
475 dirstateTupleObject *tuple;
485 dirstateTupleObject *tuple;
476 char state;
486 char state;
477 int mode, size, mtime;
487 int mode, size, mtime;
478 Py_ssize_t len, l;
488 Py_ssize_t len, l;
479 PyObject *o;
489 PyObject *o;
480 char *t;
490 char *t;
481
491
482 if (!dirstate_tuple_check(v)) {
492 if (!dirstate_tuple_check(v)) {
483 PyErr_SetString(PyExc_TypeError,
493 PyErr_SetString(PyExc_TypeError,
484 "expected a dirstate tuple");
494 "expected a dirstate tuple");
485 goto bail;
495 goto bail;
486 }
496 }
487 tuple = (dirstateTupleObject *)v;
497 tuple = (dirstateTupleObject *)v;
488
498
489 state = tuple->state;
499 state = tuple->state;
490 mode = tuple->mode;
500 mode = tuple->mode;
491 size = tuple->size;
501 size = tuple->size;
492 mtime = tuple->mtime;
502 mtime = tuple->mtime;
493 if (state == 'n' && mtime == now) {
503 if (state == 'n' && mtime == now) {
494 /* See pure/parsers.py:pack_dirstate for why we do
504 /* See pure/parsers.py:pack_dirstate for why we do
495 * this. */
505 * this. */
496 mtime = -1;
506 mtime = -1;
497 mtime_unset = (PyObject *)make_dirstate_tuple(
507 mtime_unset = (PyObject *)make_dirstate_tuple(
498 state, mode, size, mtime);
508 state, mode, size, mtime);
499 if (!mtime_unset) {
509 if (!mtime_unset) {
500 goto bail;
510 goto bail;
501 }
511 }
502 if (PyDict_SetItem(map, k, mtime_unset) == -1) {
512 if (PyDict_SetItem(map, k, mtime_unset) == -1) {
503 goto bail;
513 goto bail;
504 }
514 }
505 Py_DECREF(mtime_unset);
515 Py_DECREF(mtime_unset);
506 mtime_unset = NULL;
516 mtime_unset = NULL;
507 }
517 }
508 *p++ = state;
518 *p++ = state;
509 putbe32((uint32_t)mode, p);
519 putbe32((uint32_t)mode, p);
510 putbe32((uint32_t)size, p + 4);
520 putbe32((uint32_t)size, p + 4);
511 putbe32((uint32_t)mtime, p + 8);
521 putbe32((uint32_t)mtime, p + 8);
512 t = p + 12;
522 t = p + 12;
513 p += 16;
523 p += 16;
514 len = PyBytes_GET_SIZE(k);
524 len = PyBytes_GET_SIZE(k);
515 memcpy(p, PyBytes_AS_STRING(k), len);
525 memcpy(p, PyBytes_AS_STRING(k), len);
516 p += len;
526 p += len;
517 o = PyDict_GetItem(copymap, k);
527 o = PyDict_GetItem(copymap, k);
518 if (o) {
528 if (o) {
519 *p++ = '\0';
529 *p++ = '\0';
520 l = PyBytes_GET_SIZE(o);
530 l = PyBytes_GET_SIZE(o);
521 memcpy(p, PyBytes_AS_STRING(o), l);
531 memcpy(p, PyBytes_AS_STRING(o), l);
522 p += l;
532 p += l;
523 len += l + 1;
533 len += l + 1;
524 }
534 }
525 putbe32((uint32_t)len, t);
535 putbe32((uint32_t)len, t);
526 }
536 }
527
537
528 pos = p - PyBytes_AS_STRING(packobj);
538 pos = p - PyBytes_AS_STRING(packobj);
529 if (pos != nbytes) {
539 if (pos != nbytes) {
530 PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
540 PyErr_Format(PyExc_SystemError, "bad dirstate size: %ld != %ld",
531 (long)pos, (long)nbytes);
541 (long)pos, (long)nbytes);
532 goto bail;
542 goto bail;
533 }
543 }
534
544
535 return packobj;
545 return packobj;
536 bail:
546 bail:
537 Py_XDECREF(mtime_unset);
547 Py_XDECREF(mtime_unset);
538 Py_XDECREF(packobj);
548 Py_XDECREF(packobj);
539 Py_XDECREF(v);
549 Py_XDECREF(v);
540 return NULL;
550 return NULL;
541 }
551 }
542
552
/* Bits of the 16-bit marker `flags` field. USING_SHA_256 selects 32-byte
 * hashes instead of 20-byte ones in fm1readmarker(); BUMPED_FIX is not
 * referenced in the code visible here (NOTE(review): confirm its users). */
#define BUMPED_FIX 1
#define USING_SHA_256 2
/* Fixed marker header: 4-byte size, 8-byte mtime, 2-byte tz, 2-byte flags,
 * then three 1-byte counts (successors, parents, metadata pairs). */
#define FM1_HEADER_SIZE (4 + 8 + 2 + 2 + 1 + 1 + 1)
546
556
547 static PyObject *readshas(const char *source, unsigned char num,
557 static PyObject *readshas(const char *source, unsigned char num,
548 Py_ssize_t hashwidth)
558 Py_ssize_t hashwidth)
549 {
559 {
550 int i;
560 int i;
551 PyObject *list = PyTuple_New(num);
561 PyObject *list = PyTuple_New(num);
552 if (list == NULL) {
562 if (list == NULL) {
553 return NULL;
563 return NULL;
554 }
564 }
555 for (i = 0; i < num; i++) {
565 for (i = 0; i < num; i++) {
556 PyObject *hash = PyBytes_FromStringAndSize(source, hashwidth);
566 PyObject *hash = PyBytes_FromStringAndSize(source, hashwidth);
557 if (hash == NULL) {
567 if (hash == NULL) {
558 Py_DECREF(list);
568 Py_DECREF(list);
559 return NULL;
569 return NULL;
560 }
570 }
561 PyTuple_SET_ITEM(list, i, hash);
571 PyTuple_SET_ITEM(list, i, hash);
562 source += hashwidth;
572 source += hashwidth;
563 }
573 }
564 return list;
574 return list;
565 }
575 }
566
576
567 static PyObject *fm1readmarker(const char *databegin, const char *dataend,
577 static PyObject *fm1readmarker(const char *databegin, const char *dataend,
568 uint32_t *msize)
578 uint32_t *msize)
569 {
579 {
570 const char *data = databegin;
580 const char *data = databegin;
571 const char *meta;
581 const char *meta;
572
582
573 double mtime;
583 double mtime;
574 int16_t tz;
584 int16_t tz;
575 uint16_t flags;
585 uint16_t flags;
576 unsigned char nsuccs, nparents, nmetadata;
586 unsigned char nsuccs, nparents, nmetadata;
577 Py_ssize_t hashwidth = 20;
587 Py_ssize_t hashwidth = 20;
578
588
579 PyObject *prec = NULL, *parents = NULL, *succs = NULL;
589 PyObject *prec = NULL, *parents = NULL, *succs = NULL;
580 PyObject *metadata = NULL, *ret = NULL;
590 PyObject *metadata = NULL, *ret = NULL;
581 int i;
591 int i;
582
592
583 if (data + FM1_HEADER_SIZE > dataend) {
593 if (data + FM1_HEADER_SIZE > dataend) {
584 goto overflow;
594 goto overflow;
585 }
595 }
586
596
587 *msize = getbe32(data);
597 *msize = getbe32(data);
588 data += 4;
598 data += 4;
589 mtime = getbefloat64(data);
599 mtime = getbefloat64(data);
590 data += 8;
600 data += 8;
591 tz = getbeint16(data);
601 tz = getbeint16(data);
592 data += 2;
602 data += 2;
593 flags = getbeuint16(data);
603 flags = getbeuint16(data);
594 data += 2;
604 data += 2;
595
605
596 if (flags & USING_SHA_256) {
606 if (flags & USING_SHA_256) {
597 hashwidth = 32;
607 hashwidth = 32;
598 }
608 }
599
609
600 nsuccs = (unsigned char)(*data++);
610 nsuccs = (unsigned char)(*data++);
601 nparents = (unsigned char)(*data++);
611 nparents = (unsigned char)(*data++);
602 nmetadata = (unsigned char)(*data++);
612 nmetadata = (unsigned char)(*data++);
603
613
604 if (databegin + *msize > dataend) {
614 if (databegin + *msize > dataend) {
605 goto overflow;
615 goto overflow;
606 }
616 }
607 dataend = databegin + *msize; /* narrow down to marker size */
617 dataend = databegin + *msize; /* narrow down to marker size */
608
618
609 if (data + hashwidth > dataend) {
619 if (data + hashwidth > dataend) {
610 goto overflow;
620 goto overflow;
611 }
621 }
612 prec = PyBytes_FromStringAndSize(data, hashwidth);
622 prec = PyBytes_FromStringAndSize(data, hashwidth);
613 data += hashwidth;
623 data += hashwidth;
614 if (prec == NULL) {
624 if (prec == NULL) {
615 goto bail;
625 goto bail;
616 }
626 }
617
627
618 if (data + nsuccs * hashwidth > dataend) {
628 if (data + nsuccs * hashwidth > dataend) {
619 goto overflow;
629 goto overflow;
620 }
630 }
621 succs = readshas(data, nsuccs, hashwidth);
631 succs = readshas(data, nsuccs, hashwidth);
622 if (succs == NULL) {
632 if (succs == NULL) {
623 goto bail;
633 goto bail;
624 }
634 }
625 data += nsuccs * hashwidth;
635 data += nsuccs * hashwidth;
626
636
627 if (nparents == 1 || nparents == 2) {
637 if (nparents == 1 || nparents == 2) {
628 if (data + nparents * hashwidth > dataend) {
638 if (data + nparents * hashwidth > dataend) {
629 goto overflow;
639 goto overflow;
630 }
640 }
631 parents = readshas(data, nparents, hashwidth);
641 parents = readshas(data, nparents, hashwidth);
632 if (parents == NULL) {
642 if (parents == NULL) {
633 goto bail;
643 goto bail;
634 }
644 }
635 data += nparents * hashwidth;
645 data += nparents * hashwidth;
636 } else {
646 } else {
637 parents = Py_None;
647 parents = Py_None;
638 Py_INCREF(parents);
648 Py_INCREF(parents);
639 }
649 }
640
650
641 if (data + 2 * nmetadata > dataend) {
651 if (data + 2 * nmetadata > dataend) {
642 goto overflow;
652 goto overflow;
643 }
653 }
644 meta = data + (2 * nmetadata);
654 meta = data + (2 * nmetadata);
645 metadata = PyTuple_New(nmetadata);
655 metadata = PyTuple_New(nmetadata);
646 if (metadata == NULL) {
656 if (metadata == NULL) {
647 goto bail;
657 goto bail;
648 }
658 }
649 for (i = 0; i < nmetadata; i++) {
659 for (i = 0; i < nmetadata; i++) {
650 PyObject *tmp, *left = NULL, *right = NULL;
660 PyObject *tmp, *left = NULL, *right = NULL;
651 Py_ssize_t leftsize = (unsigned char)(*data++);
661 Py_ssize_t leftsize = (unsigned char)(*data++);
652 Py_ssize_t rightsize = (unsigned char)(*data++);
662 Py_ssize_t rightsize = (unsigned char)(*data++);
653 if (meta + leftsize + rightsize > dataend) {
663 if (meta + leftsize + rightsize > dataend) {
654 goto overflow;
664 goto overflow;
655 }
665 }
656 left = PyBytes_FromStringAndSize(meta, leftsize);
666 left = PyBytes_FromStringAndSize(meta, leftsize);
657 meta += leftsize;
667 meta += leftsize;
658 right = PyBytes_FromStringAndSize(meta, rightsize);
668 right = PyBytes_FromStringAndSize(meta, rightsize);
659 meta += rightsize;
669 meta += rightsize;
660 tmp = PyTuple_New(2);
670 tmp = PyTuple_New(2);
661 if (!left || !right || !tmp) {
671 if (!left || !right || !tmp) {
662 Py_XDECREF(left);
672 Py_XDECREF(left);
663 Py_XDECREF(right);
673 Py_XDECREF(right);
664 Py_XDECREF(tmp);
674 Py_XDECREF(tmp);
665 goto bail;
675 goto bail;
666 }
676 }
667 PyTuple_SET_ITEM(tmp, 0, left);
677 PyTuple_SET_ITEM(tmp, 0, left);
668 PyTuple_SET_ITEM(tmp, 1, right);
678 PyTuple_SET_ITEM(tmp, 1, right);
669 PyTuple_SET_ITEM(metadata, i, tmp);
679 PyTuple_SET_ITEM(metadata, i, tmp);
670 }
680 }
671 ret = Py_BuildValue("(OOHO(di)O)", prec, succs, flags, metadata, mtime,
681 ret = Py_BuildValue("(OOHO(di)O)", prec, succs, flags, metadata, mtime,
672 (int)tz * 60, parents);
682 (int)tz * 60, parents);
673 goto bail; /* return successfully */
683 goto bail; /* return successfully */
674
684
675 overflow:
685 overflow:
676 PyErr_SetString(PyExc_ValueError, "overflow in obsstore");
686 PyErr_SetString(PyExc_ValueError, "overflow in obsstore");
677 bail:
687 bail:
678 Py_XDECREF(prec);
688 Py_XDECREF(prec);
679 Py_XDECREF(succs);
689 Py_XDECREF(succs);
680 Py_XDECREF(metadata);
690 Py_XDECREF(metadata);
681 Py_XDECREF(parents);
691 Py_XDECREF(parents);
682 return ret;
692 return ret;
683 }
693 }
684
694
685 static PyObject *fm1readmarkers(PyObject *self, PyObject *args)
695 static PyObject *fm1readmarkers(PyObject *self, PyObject *args)
686 {
696 {
687 const char *data, *dataend;
697 const char *data, *dataend;
688 Py_ssize_t datalen, offset, stop;
698 Py_ssize_t datalen, offset, stop;
689 PyObject *markers = NULL;
699 PyObject *markers = NULL;
690
700
691 if (!PyArg_ParseTuple(args, PY23("s#nn", "y#nn"), &data, &datalen,
701 if (!PyArg_ParseTuple(args, PY23("s#nn", "y#nn"), &data, &datalen,
692 &offset, &stop)) {
702 &offset, &stop)) {
693 return NULL;
703 return NULL;
694 }
704 }
695 if (offset < 0) {
705 if (offset < 0) {
696 PyErr_SetString(PyExc_ValueError,
706 PyErr_SetString(PyExc_ValueError,
697 "invalid negative offset in fm1readmarkers");
707 "invalid negative offset in fm1readmarkers");
698 return NULL;
708 return NULL;
699 }
709 }
700 if (stop > datalen) {
710 if (stop > datalen) {
701 PyErr_SetString(
711 PyErr_SetString(
702 PyExc_ValueError,
712 PyExc_ValueError,
703 "stop longer than data length in fm1readmarkers");
713 "stop longer than data length in fm1readmarkers");
704 return NULL;
714 return NULL;
705 }
715 }
706 dataend = data + datalen;
716 dataend = data + datalen;
707 data += offset;
717 data += offset;
708 markers = PyList_New(0);
718 markers = PyList_New(0);
709 if (!markers) {
719 if (!markers) {
710 return NULL;
720 return NULL;
711 }
721 }
712 while (offset < stop) {
722 while (offset < stop) {
713 uint32_t msize;
723 uint32_t msize;
714 int error;
724 int error;
715 PyObject *record = fm1readmarker(data, dataend, &msize);
725 PyObject *record = fm1readmarker(data, dataend, &msize);
716 if (!record) {
726 if (!record) {
717 goto bail;
727 goto bail;
718 }
728 }
719 error = PyList_Append(markers, record);
729 error = PyList_Append(markers, record);
720 Py_DECREF(record);
730 Py_DECREF(record);
721 if (error) {
731 if (error) {
722 goto bail;
732 goto bail;
723 }
733 }
724 data += msize;
734 data += msize;
725 offset += msize;
735 offset += msize;
726 }
736 }
727 return markers;
737 return markers;
728 bail:
738 bail:
729 Py_DECREF(markers);
739 Py_DECREF(markers);
730 return NULL;
740 return NULL;
731 }
741 }
732
742
733 static char parsers_doc[] = "Efficient content parsing.";
743 static char parsers_doc[] = "Efficient content parsing.";
734
744
735 PyObject *encodedir(PyObject *self, PyObject *args);
745 PyObject *encodedir(PyObject *self, PyObject *args);
736 PyObject *pathencode(PyObject *self, PyObject *args);
746 PyObject *pathencode(PyObject *self, PyObject *args);
737 PyObject *lowerencode(PyObject *self, PyObject *args);
747 PyObject *lowerencode(PyObject *self, PyObject *args);
738 PyObject *parse_index2(PyObject *self, PyObject *args, PyObject *kwargs);
748 PyObject *parse_index2(PyObject *self, PyObject *args, PyObject *kwargs);
739
749
740 static PyMethodDef methods[] = {
750 static PyMethodDef methods[] = {
741 {"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
751 {"pack_dirstate", pack_dirstate, METH_VARARGS, "pack a dirstate\n"},
742 {"nonnormalotherparententries", nonnormalotherparententries, METH_VARARGS,
752 {"nonnormalotherparententries", nonnormalotherparententries, METH_VARARGS,
743 "create a set containing non-normal and other parent entries of given "
753 "create a set containing non-normal and other parent entries of given "
744 "dirstate\n"},
754 "dirstate\n"},
745 {"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
755 {"parse_dirstate", parse_dirstate, METH_VARARGS, "parse a dirstate\n"},
746 {"parse_index2", (PyCFunction)parse_index2, METH_VARARGS | METH_KEYWORDS,
756 {"parse_index2", (PyCFunction)parse_index2, METH_VARARGS | METH_KEYWORDS,
747 "parse a revlog index\n"},
757 "parse a revlog index\n"},
748 {"isasciistr", isasciistr, METH_VARARGS, "check if an ASCII string\n"},
758 {"isasciistr", isasciistr, METH_VARARGS, "check if an ASCII string\n"},
749 {"asciilower", asciilower, METH_VARARGS, "lowercase an ASCII string\n"},
759 {"asciilower", asciilower, METH_VARARGS, "lowercase an ASCII string\n"},
750 {"asciiupper", asciiupper, METH_VARARGS, "uppercase an ASCII string\n"},
760 {"asciiupper", asciiupper, METH_VARARGS, "uppercase an ASCII string\n"},
751 {"dict_new_presized", dict_new_presized, METH_VARARGS,
761 {"dict_new_presized", dict_new_presized, METH_VARARGS,
752 "construct a dict with an expected size\n"},
762 "construct a dict with an expected size\n"},
753 {"make_file_foldmap", make_file_foldmap, METH_VARARGS,
763 {"make_file_foldmap", make_file_foldmap, METH_VARARGS,
754 "make file foldmap\n"},
764 "make file foldmap\n"},
755 {"jsonescapeu8fast", jsonescapeu8fast, METH_VARARGS,
765 {"jsonescapeu8fast", jsonescapeu8fast, METH_VARARGS,
756 "escape a UTF-8 byte string to JSON (fast path)\n"},
766 "escape a UTF-8 byte string to JSON (fast path)\n"},
757 {"encodedir", encodedir, METH_VARARGS, "encodedir a path\n"},
767 {"encodedir", encodedir, METH_VARARGS, "encodedir a path\n"},
758 {"pathencode", pathencode, METH_VARARGS, "fncache-encode a path\n"},
768 {"pathencode", pathencode, METH_VARARGS, "fncache-encode a path\n"},
759 {"lowerencode", lowerencode, METH_VARARGS, "lower-encode a path\n"},
769 {"lowerencode", lowerencode, METH_VARARGS, "lower-encode a path\n"},
760 {"fm1readmarkers", fm1readmarkers, METH_VARARGS,
770 {"fm1readmarkers", fm1readmarkers, METH_VARARGS,
761 "parse v1 obsolete markers\n"},
771 "parse v1 obsolete markers\n"},
762 {NULL, NULL}};
772 {NULL, NULL}};
763
773
764 void dirs_module_init(PyObject *mod);
774 void dirs_module_init(PyObject *mod);
765 void manifest_module_init(PyObject *mod);
775 void manifest_module_init(PyObject *mod);
766 void revlog_module_init(PyObject *mod);
776 void revlog_module_init(PyObject *mod);
767
777
768 static const int version = 20;
778 static const int version = 20;
769
779
770 static void module_init(PyObject *mod)
780 static void module_init(PyObject *mod)
771 {
781 {
772 PyObject *capsule = NULL;
782 PyObject *capsule = NULL;
773 PyModule_AddIntConstant(mod, "version", version);
783 PyModule_AddIntConstant(mod, "version", version);
774
784
775 /* This module constant has two purposes. First, it lets us unit test
785 /* This module constant has two purposes. First, it lets us unit test
776 * the ImportError raised without hard-coding any error text. This
786 * the ImportError raised without hard-coding any error text. This
777 * means we can change the text in the future without breaking tests,
787 * means we can change the text in the future without breaking tests,
778 * even across changesets without a recompile. Second, its presence
788 * even across changesets without a recompile. Second, its presence
779 * can be used to determine whether the version-checking logic is
789 * can be used to determine whether the version-checking logic is
780 * present, which also helps in testing across changesets without a
790 * present, which also helps in testing across changesets without a
781 * recompile. Note that this means the pure-Python version of parsers
791 * recompile. Note that this means the pure-Python version of parsers
782 * should not have this module constant. */
792 * should not have this module constant. */
783 PyModule_AddStringConstant(mod, "versionerrortext", versionerrortext);
793 PyModule_AddStringConstant(mod, "versionerrortext", versionerrortext);
784
794
785 dirs_module_init(mod);
795 dirs_module_init(mod);
786 manifest_module_init(mod);
796 manifest_module_init(mod);
787 revlog_module_init(mod);
797 revlog_module_init(mod);
788
798
789 capsule = PyCapsule_New(
799 capsule = PyCapsule_New(
790 make_dirstate_tuple,
800 make_dirstate_tuple,
791 "mercurial.cext.parsers.make_dirstate_tuple_CAPI", NULL);
801 "mercurial.cext.parsers.make_dirstate_tuple_CAPI", NULL);
792 if (capsule != NULL)
802 if (capsule != NULL)
793 PyModule_AddObject(mod, "make_dirstate_tuple_CAPI", capsule);
803 PyModule_AddObject(mod, "make_dirstate_tuple_CAPI", capsule);
794
804
795 if (PyType_Ready(&dirstateTupleType) < 0) {
805 if (PyType_Ready(&dirstateTupleType) < 0) {
796 return;
806 return;
797 }
807 }
798 Py_INCREF(&dirstateTupleType);
808 Py_INCREF(&dirstateTupleType);
799 PyModule_AddObject(mod, "dirstatetuple",
809 PyModule_AddObject(mod, "dirstatetuple",
800 (PyObject *)&dirstateTupleType);
810 (PyObject *)&dirstateTupleType);
801 }
811 }
802
812
803 static int check_python_version(void)
813 static int check_python_version(void)
804 {
814 {
805 PyObject *sys = PyImport_ImportModule("sys"), *ver;
815 PyObject *sys = PyImport_ImportModule("sys"), *ver;
806 long hexversion;
816 long hexversion;
807 if (!sys) {
817 if (!sys) {
808 return -1;
818 return -1;
809 }
819 }
810 ver = PyObject_GetAttrString(sys, "hexversion");
820 ver = PyObject_GetAttrString(sys, "hexversion");
811 Py_DECREF(sys);
821 Py_DECREF(sys);
812 if (!ver) {
822 if (!ver) {
813 return -1;
823 return -1;
814 }
824 }
815 hexversion = PyInt_AsLong(ver);
825 hexversion = PyInt_AsLong(ver);
816 Py_DECREF(ver);
826 Py_DECREF(ver);
817 /* sys.hexversion is a 32-bit number by default, so the -1 case
827 /* sys.hexversion is a 32-bit number by default, so the -1 case
818 * should only occur in unusual circumstances (e.g. if sys.hexversion
828 * should only occur in unusual circumstances (e.g. if sys.hexversion
819 * is manually set to an invalid value). */
829 * is manually set to an invalid value). */
820 if ((hexversion == -1) || (hexversion >> 16 != PY_VERSION_HEX >> 16)) {
830 if ((hexversion == -1) || (hexversion >> 16 != PY_VERSION_HEX >> 16)) {
821 PyErr_Format(PyExc_ImportError,
831 PyErr_Format(PyExc_ImportError,
822 "%s: The Mercurial extension "
832 "%s: The Mercurial extension "
823 "modules were compiled with Python " PY_VERSION
833 "modules were compiled with Python " PY_VERSION
824 ", but "
834 ", but "
825 "Mercurial is currently using Python with "
835 "Mercurial is currently using Python with "
826 "sys.hexversion=%ld: "
836 "sys.hexversion=%ld: "
827 "Python %s\n at: %s",
837 "Python %s\n at: %s",
828 versionerrortext, hexversion, Py_GetVersion(),
838 versionerrortext, hexversion, Py_GetVersion(),
829 Py_GetProgramFullPath());
839 Py_GetProgramFullPath());
830 return -1;
840 return -1;
831 }
841 }
832 return 0;
842 return 0;
833 }
843 }
834
844
835 #ifdef IS_PY3K
845 #ifdef IS_PY3K
836 static struct PyModuleDef parsers_module = {PyModuleDef_HEAD_INIT, "parsers",
846 static struct PyModuleDef parsers_module = {PyModuleDef_HEAD_INIT, "parsers",
837 parsers_doc, -1, methods};
847 parsers_doc, -1, methods};
838
848
839 PyMODINIT_FUNC PyInit_parsers(void)
849 PyMODINIT_FUNC PyInit_parsers(void)
840 {
850 {
841 PyObject *mod;
851 PyObject *mod;
842
852
843 if (check_python_version() == -1)
853 if (check_python_version() == -1)
844 return NULL;
854 return NULL;
845 mod = PyModule_Create(&parsers_module);
855 mod = PyModule_Create(&parsers_module);
846 module_init(mod);
856 module_init(mod);
847 return mod;
857 return mod;
848 }
858 }
849 #else
859 #else
850 PyMODINIT_FUNC initparsers(void)
860 PyMODINIT_FUNC initparsers(void)
851 {
861 {
852 PyObject *mod;
862 PyObject *mod;
853
863
854 if (check_python_version() == -1) {
864 if (check_python_version() == -1) {
855 return;
865 return;
856 }
866 }
857 mod = Py_InitModule3("parsers", methods, parsers_doc);
867 mod = Py_InitModule3("parsers", methods, parsers_doc);
858 module_init(mod);
868 module_init(mod);
859 }
869 }
860 #endif
870 #endif
@@ -1,1437 +1,1437 b''
1 # dirstate.py - working directory tracking for mercurial
1 # dirstate.py - working directory tracking for mercurial
2 #
2 #
3 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
3 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import collections
10 import collections
11 import contextlib
11 import contextlib
12 import errno
12 import errno
13 import os
13 import os
14 import stat
14 import stat
15
15
16 from .i18n import _
16 from .i18n import _
17 from .pycompat import delattr
17 from .pycompat import delattr
18
18
19 from hgdemandimport import tracing
19 from hgdemandimport import tracing
20
20
21 from . import (
21 from . import (
22 dirstatemap,
22 dirstatemap,
23 encoding,
23 encoding,
24 error,
24 error,
25 match as matchmod,
25 match as matchmod,
26 pathutil,
26 pathutil,
27 policy,
27 policy,
28 pycompat,
28 pycompat,
29 scmutil,
29 scmutil,
30 sparse,
30 sparse,
31 util,
31 util,
32 )
32 )
33
33
34 from .interfaces import (
34 from .interfaces import (
35 dirstate as intdirstate,
35 dirstate as intdirstate,
36 util as interfaceutil,
36 util as interfaceutil,
37 )
37 )
38
38
39 parsers = policy.importmod('parsers')
39 parsers = policy.importmod('parsers')
40 rustmod = policy.importrust('dirstate')
40 rustmod = policy.importrust('dirstate')
41
41
42 SUPPORTS_DIRSTATE_V2 = rustmod is not None
42 SUPPORTS_DIRSTATE_V2 = rustmod is not None
43
43
44 propertycache = util.propertycache
44 propertycache = util.propertycache
45 filecache = scmutil.filecache
45 filecache = scmutil.filecache
46 _rangemask = dirstatemap.rangemask
46 _rangemask = dirstatemap.rangemask
47
47
48 dirstatetuple = parsers.dirstatetuple
48 dirstatetuple = parsers.dirstatetuple
49
49
50
50
class repocache(filecache):
    """filecache for files in .hg/

    Paths are resolved through the ``_opener`` of the owning object.
    """

    def join(self, obj, fname):
        opener = obj._opener
        return opener.join(fname)
56
56
57
57
class rootcache(filecache):
    """filecache for files in the repository root

    Paths are resolved through the ``_join`` method of the owning object.
    """

    def join(self, obj, fname):
        joiner = obj._join
        return joiner(fname)
63
63
64
64
65 def _getfsnow(vfs):
65 def _getfsnow(vfs):
66 '''Get "now" timestamp on filesystem'''
66 '''Get "now" timestamp on filesystem'''
67 tmpfd, tmpname = vfs.mkstemp()
67 tmpfd, tmpname = vfs.mkstemp()
68 try:
68 try:
69 return os.fstat(tmpfd)[stat.ST_MTIME]
69 return os.fstat(tmpfd)[stat.ST_MTIME]
70 finally:
70 finally:
71 os.close(tmpfd)
71 os.close(tmpfd)
72 vfs.unlink(tmpname)
72 vfs.unlink(tmpname)
73
73
74
74
75 @interfaceutil.implementer(intdirstate.idirstate)
75 @interfaceutil.implementer(intdirstate.idirstate)
76 class dirstate(object):
76 class dirstate(object):
def __init__(
    self,
    opener,
    ui,
    root,
    validate,
    sparsematchfn,
    nodeconstants,
    use_dirstate_v2,
):
    """Create a new dirstate object.

    opener is an open()-like callable that can be used to open the
    dirstate file; root is the root of the directory tracked by
    the dirstate. The other arguments are stored on the instance as-is.
    """
    # values handed in by the caller
    self._opener = opener
    self._ui = ui
    self._root = root
    self._validate = validate
    self._sparsematchfn = sparsematchfn
    self._nodeconstants = nodeconstants
    self._use_dirstate_v2 = use_dirstate_v2

    # ntpath.join(root, '') of Python 2.7.9 does not add sep if root is
    # UNC path pointing to root share (issue4557)
    self._rootdir = pathutil.normasprefix(root)

    # file names
    self._filename = b'dirstate'
    self._pendingfilename = b'%s.pending' % self._filename

    # initial bookkeeping state
    self._dirty = False
    self._lastnormaltime = 0
    self._parentwriters = 0
    self._origpl = None
    self._filecache = {}
    self._plchangecallbacks = {}
    self._updatedfiles = set()
    self._mapcls = dirstatemap.dirstatemap

    # Access and cache cwd early, so we don't access it for the first time
    # after a working-copy update caused it to not exist (accessing it then
    # raises an exception).
    self._cwd
117
117
118 def prefetch_parents(self):
118 def prefetch_parents(self):
119 """make sure the parents are loaded
119 """make sure the parents are loaded
120
120
121 Used to avoid a race condition.
121 Used to avoid a race condition.
122 """
122 """
123 self._pl
123 self._pl
124
124
125 @contextlib.contextmanager
125 @contextlib.contextmanager
126 def parentchange(self):
126 def parentchange(self):
127 """Context manager for handling dirstate parents.
127 """Context manager for handling dirstate parents.
128
128
129 If an exception occurs in the scope of the context manager,
129 If an exception occurs in the scope of the context manager,
130 the incoherent dirstate won't be written when wlock is
130 the incoherent dirstate won't be written when wlock is
131 released.
131 released.
132 """
132 """
133 self._parentwriters += 1
133 self._parentwriters += 1
134 yield
134 yield
135 # Typically we want the "undo" step of a context manager in a
135 # Typically we want the "undo" step of a context manager in a
136 # finally block so it happens even when an exception
136 # finally block so it happens even when an exception
137 # occurs. In this case, however, we only want to decrement
137 # occurs. In this case, however, we only want to decrement
138 # parentwriters if the code in the with statement exits
138 # parentwriters if the code in the with statement exits
139 # normally, so we don't have a try/finally here on purpose.
139 # normally, so we don't have a try/finally here on purpose.
140 self._parentwriters -= 1
140 self._parentwriters -= 1
141
141
142 def pendingparentchange(self):
142 def pendingparentchange(self):
143 """Returns true if the dirstate is in the middle of a set of changes
143 """Returns true if the dirstate is in the middle of a set of changes
144 that modify the dirstate parent.
144 that modify the dirstate parent.
145 """
145 """
146 return self._parentwriters > 0
146 return self._parentwriters > 0
147
147
@propertycache
def _map(self):
    """Return the dirstate contents (see documentation for dirstatemap)."""
    mapargs = (
        self._ui,
        self._opener,
        self._root,
        self._nodeconstants,
        self._use_dirstate_v2,
    )
    # store the new map on the instance before handing it back
    self._map = self._mapcls(*mapargs)
    return self._map
159
159
160 @property
160 @property
161 def _sparsematcher(self):
161 def _sparsematcher(self):
162 """The matcher for the sparse checkout.
162 """The matcher for the sparse checkout.
163
163
164 The working directory may not include every file from a manifest. The
164 The working directory may not include every file from a manifest. The
165 matcher obtained by this property will match a path if it is to be
165 matcher obtained by this property will match a path if it is to be
166 included in the working directory.
166 included in the working directory.
167 """
167 """
168 # TODO there is potential to cache this property. For now, the matcher
168 # TODO there is potential to cache this property. For now, the matcher
169 # is resolved on every access. (But the called function does use a
169 # is resolved on every access. (But the called function does use a
170 # cache to keep the lookup fast.)
170 # cache to keep the lookup fast.)
171 return self._sparsematchfn()
171 return self._sparsematchfn()
172
172
@repocache(b'branch')
def _branch(self):
    """Read the branch name from the ``branch`` file via the opener.

    Falls back to ``b"default"`` when the file is missing (ENOENT) or its
    stripped content is empty; any other IOError is re-raised.
    """
    try:
        name = self._opener.read(b"branch").strip()
    except IOError as err:
        if err.errno == errno.ENOENT:
            return b"default"
        raise
    return name or b"default"
181
181
182 @property
182 @property
183 def _pl(self):
183 def _pl(self):
184 return self._map.parents()
184 return self._map.parents()
185
185
186 def hasdir(self, d):
186 def hasdir(self, d):
187 return self._map.hastrackeddir(d)
187 return self._map.hastrackeddir(d)
188
188
@rootcache(b'.hgignore')
def _ignore(self):
    """Build a matcher from the files listed by ``_ignorefiles()``.

    With no such files, ``matchmod.never()`` is returned; otherwise each
    file becomes an ``include:`` pattern.
    """
    ignorefiles = self._ignorefiles()
    if ignorefiles:
        patterns = []
        for name in ignorefiles:
            patterns.append(b'include:%s' % name)
        return matchmod.match(
            self._root, b'', [], patterns, warn=self._ui.warn
        )
    return matchmod.never()
197
197
@propertycache
def _slash(self):
    """``ui.slash`` config value, and-ed with "the OS separator is not /"."""
    wanted = self._ui.configbool(b'ui', b'slash')
    if not wanted:
        # same short-circuit result as ``wanted and ...``
        return wanted
    return pycompat.ossep != b'/'
201
201
@propertycache
def _checklink(self):
    """Result of ``util.checklink()`` for the repository root."""
    root = self._root
    return util.checklink(root)
205
205
@propertycache
def _checkexec(self):
    """Result of ``util.checkexec()`` for the repository root, as a bool."""
    supported = util.checkexec(self._root)
    return bool(supported)
209
209
@propertycache
def _checkcase(self):
    """True when ``util.fscasesensitive()`` reports False for ``.hg``."""
    hgdir = self._join(b'.hg')
    return not util.fscasesensitive(hgdir)
213
213
214 def _join(self, f):
214 def _join(self, f):
215 # much faster than os.path.join()
215 # much faster than os.path.join()
216 # it's safe because f is always a relative path
216 # it's safe because f is always a relative path
217 return self._rootdir + f
217 return self._rootdir + f
218
218
219 def flagfunc(self, buildfallback):
219 def flagfunc(self, buildfallback):
220 if self._checklink and self._checkexec:
220 if self._checklink and self._checkexec:
221
221
222 def f(x):
222 def f(x):
223 try:
223 try:
224 st = os.lstat(self._join(x))
224 st = os.lstat(self._join(x))
225 if util.statislink(st):
225 if util.statislink(st):
226 return b'l'
226 return b'l'
227 if util.statisexec(st):
227 if util.statisexec(st):
228 return b'x'
228 return b'x'
229 except OSError:
229 except OSError:
230 pass
230 pass
231 return b''
231 return b''
232
232
233 return f
233 return f
234
234
235 fallback = buildfallback()
235 fallback = buildfallback()
236 if self._checklink:
236 if self._checklink:
237
237
238 def f(x):
238 def f(x):
239 if os.path.islink(self._join(x)):
239 if os.path.islink(self._join(x)):
240 return b'l'
240 return b'l'
241 if b'x' in fallback(x):
241 if b'x' in fallback(x):
242 return b'x'
242 return b'x'
243 return b''
243 return b''
244
244
245 return f
245 return f
246 if self._checkexec:
246 if self._checkexec:
247
247
248 def f(x):
248 def f(x):
249 if b'l' in fallback(x):
249 if b'l' in fallback(x):
250 return b'l'
250 return b'l'
251 if util.isexec(self._join(x)):
251 if util.isexec(self._join(x)):
252 return b'x'
252 return b'x'
253 return b''
253 return b''
254
254
255 return f
255 return f
256 else:
256 else:
257 return fallback
257 return fallback
258
258
@propertycache
def _cwd(self):
    """The ``ui.forcecwd`` config value if set, else ``encoding.getcwd()``."""
    # internal config: ui.forcecwd
    forced = self._ui.config(b'ui', b'forcecwd')
    return forced if forced else encoding.getcwd()
266
266
267 def getcwd(self):
267 def getcwd(self):
268 """Return the path from which a canonical path is calculated.
268 """Return the path from which a canonical path is calculated.
269
269
270 This path should be used to resolve file patterns or to convert
270 This path should be used to resolve file patterns or to convert
271 canonical paths back to file paths for display. It shouldn't be
271 canonical paths back to file paths for display. It shouldn't be
272 used to get real file paths. Use vfs functions instead.
272 used to get real file paths. Use vfs functions instead.
273 """
273 """
274 cwd = self._cwd
274 cwd = self._cwd
275 if cwd == self._root:
275 if cwd == self._root:
276 return b''
276 return b''
277 # self._root ends with a path separator if self._root is '/' or 'C:\'
277 # self._root ends with a path separator if self._root is '/' or 'C:\'
278 rootsep = self._root
278 rootsep = self._root
279 if not util.endswithsep(rootsep):
279 if not util.endswithsep(rootsep):
280 rootsep += pycompat.ossep
280 rootsep += pycompat.ossep
281 if cwd.startswith(rootsep):
281 if cwd.startswith(rootsep):
282 return cwd[len(rootsep) :]
282 return cwd[len(rootsep) :]
283 else:
283 else:
284 # we're outside the repo. return an absolute path.
284 # we're outside the repo. return an absolute path.
285 return cwd
285 return cwd
286
286
def pathto(self, f, cwd=None):
    """Return ``util.pathto()`` of ``f`` from ``cwd``.

    ``cwd`` defaults to ``self.getcwd()``; the result is passed through
    ``util.pconvert()`` when ``self._slash`` is true.
    """
    if cwd is None:
        cwd = self.getcwd()
    relpath = util.pathto(self._root, cwd, f)
    return util.pconvert(relpath) if self._slash else relpath
294
294
295 def __getitem__(self, key):
295 def __getitem__(self, key):
296 """Return the current state of key (a filename) in the dirstate.
296 """Return the current state of key (a filename) in the dirstate.
297
297
298 States are:
298 States are:
299 n normal
299 n normal
300 m needs merging
300 m needs merging
301 r marked for removal
301 r marked for removal
302 a marked for addition
302 a marked for addition
303 ? not tracked
303 ? not tracked
304
304
305 XXX The "state" is a bit obscure to be in the "public" API. we should
305 XXX The "state" is a bit obscure to be in the "public" API. we should
306 consider migrating all user of this to going through the dirstate entry
306 consider migrating all user of this to going through the dirstate entry
307 instead.
307 instead.
308 """
308 """
309 entry = self._map.get(key)
309 entry = self._map.get(key)
310 if entry is not None:
310 if entry is not None:
311 return entry.state
311 return entry.state
312 return b'?'
312 return b'?'
313
313
314 def __contains__(self, key):
314 def __contains__(self, key):
315 return key in self._map
315 return key in self._map
316
316
317 def __iter__(self):
317 def __iter__(self):
318 return iter(sorted(self._map))
318 return iter(sorted(self._map))
319
319
def items(self):
    """Return ``pycompat.iteritems()`` of the underlying map."""
    dmap = self._map
    return pycompat.iteritems(dmap)

iteritems = items
324
324
325 def directories(self):
325 def directories(self):
326 return self._map.directories()
326 return self._map.directories()
327
327
328 def parents(self):
328 def parents(self):
329 return [self._validate(p) for p in self._pl]
329 return [self._validate(p) for p in self._pl]
330
330
331 def p1(self):
331 def p1(self):
332 return self._validate(self._pl[0])
332 return self._validate(self._pl[0])
333
333
334 def p2(self):
334 def p2(self):
335 return self._validate(self._pl[1])
335 return self._validate(self._pl[1])
336
336
337 @property
337 @property
338 def in_merge(self):
338 def in_merge(self):
339 """True if a merge is in progress"""
339 """True if a merge is in progress"""
340 return self._pl[1] != self._nodeconstants.nullid
340 return self._pl[1] != self._nodeconstants.nullid
341
341
342 def branch(self):
342 def branch(self):
343 return encoding.tolocal(self._branch)
343 return encoding.tolocal(self._branch)
344
344
345 def setparents(self, p1, p2=None):
345 def setparents(self, p1, p2=None):
346 """Set dirstate parents to p1 and p2.
346 """Set dirstate parents to p1 and p2.
347
347
348 When moving from two parents to one, "merged" entries a
348 When moving from two parents to one, "merged" entries a
349 adjusted to normal and previous copy records discarded and
349 adjusted to normal and previous copy records discarded and
350 returned by the call.
350 returned by the call.
351
351
352 See localrepo.setparents()
352 See localrepo.setparents()
353 """
353 """
354 if p2 is None:
354 if p2 is None:
355 p2 = self._nodeconstants.nullid
355 p2 = self._nodeconstants.nullid
356 if self._parentwriters == 0:
356 if self._parentwriters == 0:
357 raise ValueError(
357 raise ValueError(
358 b"cannot set dirstate parent outside of "
358 b"cannot set dirstate parent outside of "
359 b"dirstate.parentchange context manager"
359 b"dirstate.parentchange context manager"
360 )
360 )
361
361
362 self._dirty = True
362 self._dirty = True
363 oldp2 = self._pl[1]
363 oldp2 = self._pl[1]
364 if self._origpl is None:
364 if self._origpl is None:
365 self._origpl = self._pl
365 self._origpl = self._pl
366 self._map.setparents(p1, p2)
366 self._map.setparents(p1, p2)
367 copies = {}
367 copies = {}
368 if (
368 if (
369 oldp2 != self._nodeconstants.nullid
369 oldp2 != self._nodeconstants.nullid
370 and p2 == self._nodeconstants.nullid
370 and p2 == self._nodeconstants.nullid
371 ):
371 ):
372 candidatefiles = self._map.non_normal_or_other_parent_paths()
372 candidatefiles = self._map.non_normal_or_other_parent_paths()
373
373
374 for f in candidatefiles:
374 for f in candidatefiles:
375 s = self._map.get(f)
375 s = self._map.get(f)
376 if s is None:
376 if s is None:
377 continue
377 continue
378
378
379 # Discard "merged" markers when moving away from a merge state
379 # Discard "merged" markers when moving away from a merge state
380 if s.merged:
380 if s.merged:
381 source = self._map.copymap.get(f)
381 source = self._map.copymap.get(f)
382 if source:
382 if source:
383 copies[f] = source
383 copies[f] = source
384 self.normallookup(f)
384 self.normallookup(f)
385 # Also fix up otherparent markers
385 # Also fix up otherparent markers
386 elif s.from_p2:
386 elif s.from_p2:
387 source = self._map.copymap.get(f)
387 source = self._map.copymap.get(f)
388 if source:
388 if source:
389 copies[f] = source
389 copies[f] = source
390 self.add(f)
390 self.add(f)
391 return copies
391 return copies
392
392
393 def setbranch(self, branch):
393 def setbranch(self, branch):
394 self.__class__._branch.set(self, encoding.fromlocal(branch))
394 self.__class__._branch.set(self, encoding.fromlocal(branch))
395 f = self._opener(b'branch', b'w', atomictemp=True, checkambig=True)
395 f = self._opener(b'branch', b'w', atomictemp=True, checkambig=True)
396 try:
396 try:
397 f.write(self._branch + b'\n')
397 f.write(self._branch + b'\n')
398 f.close()
398 f.close()
399
399
400 # make sure filecache has the correct stat info for _branch after
400 # make sure filecache has the correct stat info for _branch after
401 # replacing the underlying file
401 # replacing the underlying file
402 ce = self._filecache[b'_branch']
402 ce = self._filecache[b'_branch']
403 if ce:
403 if ce:
404 ce.refresh()
404 ce.refresh()
405 except: # re-raises
405 except: # re-raises
406 f.discard()
406 f.discard()
407 raise
407 raise
408
408
409 def invalidate(self):
409 def invalidate(self):
410 """Causes the next access to reread the dirstate.
410 """Causes the next access to reread the dirstate.
411
411
412 This is different from localrepo.invalidatedirstate() because it always
412 This is different from localrepo.invalidatedirstate() because it always
413 rereads the dirstate. Use localrepo.invalidatedirstate() if you want to
413 rereads the dirstate. Use localrepo.invalidatedirstate() if you want to
414 check whether the dirstate has changed before rereading it."""
414 check whether the dirstate has changed before rereading it."""
415
415
416 for a in ("_map", "_branch", "_ignore"):
416 for a in ("_map", "_branch", "_ignore"):
417 if a in self.__dict__:
417 if a in self.__dict__:
418 delattr(self, a)
418 delattr(self, a)
419 self._lastnormaltime = 0
419 self._lastnormaltime = 0
420 self._dirty = False
420 self._dirty = False
421 self._updatedfiles.clear()
421 self._updatedfiles.clear()
422 self._parentwriters = 0
422 self._parentwriters = 0
423 self._origpl = None
423 self._origpl = None
424
424
425 def copy(self, source, dest):
425 def copy(self, source, dest):
426 """Mark dest as a copy of source. Unmark dest if source is None."""
426 """Mark dest as a copy of source. Unmark dest if source is None."""
427 if source == dest:
427 if source == dest:
428 return
428 return
429 self._dirty = True
429 self._dirty = True
430 if source is not None:
430 if source is not None:
431 self._map.copymap[dest] = source
431 self._map.copymap[dest] = source
432 self._updatedfiles.add(source)
432 self._updatedfiles.add(source)
433 self._updatedfiles.add(dest)
433 self._updatedfiles.add(dest)
434 elif self._map.copymap.pop(dest, None):
434 elif self._map.copymap.pop(dest, None):
435 self._updatedfiles.add(dest)
435 self._updatedfiles.add(dest)
436
436
437 def copied(self, file):
437 def copied(self, file):
438 return self._map.copymap.get(file, None)
438 return self._map.copymap.get(file, None)
439
439
440 def copies(self):
440 def copies(self):
441 return self._map.copymap
441 return self._map.copymap
442
442
443 def _addpath(
443 def _addpath(
444 self,
444 self,
445 f,
445 f,
446 state=None,
446 state=None,
447 mode=0,
447 mode=0,
448 size=None,
448 size=None,
449 mtime=None,
449 mtime=None,
450 added=False,
450 added=False,
451 from_p2=False,
451 from_p2=False,
452 possibly_dirty=False,
452 possibly_dirty=False,
453 ):
453 ):
454 entry = self._map.get(f)
454 entry = self._map.get(f)
455 if added or entry is not None and entry.removed:
455 if added or entry is not None and entry.removed:
456 scmutil.checkfilename(f)
456 scmutil.checkfilename(f)
457 if self._map.hastrackeddir(f):
457 if self._map.hastrackeddir(f):
458 msg = _(b'directory %r already in dirstate')
458 msg = _(b'directory %r already in dirstate')
459 msg %= pycompat.bytestr(f)
459 msg %= pycompat.bytestr(f)
460 raise error.Abort(msg)
460 raise error.Abort(msg)
461 # shadows
461 # shadows
462 for d in pathutil.finddirs(f):
462 for d in pathutil.finddirs(f):
463 if self._map.hastrackeddir(d):
463 if self._map.hastrackeddir(d):
464 break
464 break
465 entry = self._map.get(d)
465 entry = self._map.get(d)
466 if entry is not None and not entry.removed:
466 if entry is not None and not entry.removed:
467 msg = _(b'file %r in dirstate clashes with %r')
467 msg = _(b'file %r in dirstate clashes with %r')
468 msg %= (pycompat.bytestr(d), pycompat.bytestr(f))
468 msg %= (pycompat.bytestr(d), pycompat.bytestr(f))
469 raise error.Abort(msg)
469 raise error.Abort(msg)
470 self._dirty = True
470 self._dirty = True
471 self._updatedfiles.add(f)
471 self._updatedfiles.add(f)
472 self._map.addfile(
472 self._map.addfile(
473 f,
473 f,
474 state=state,
474 state=state,
475 mode=mode,
475 mode=mode,
476 size=size,
476 size=size,
477 mtime=mtime,
477 mtime=mtime,
478 added=added,
478 added=added,
479 from_p2=from_p2,
479 from_p2=from_p2,
480 possibly_dirty=possibly_dirty,
480 possibly_dirty=possibly_dirty,
481 )
481 )
482
482
483 def normal(self, f, parentfiledata=None):
483 def normal(self, f, parentfiledata=None):
484 """Mark a file normal and clean.
484 """Mark a file normal and clean.
485
485
486 parentfiledata: (mode, size, mtime) of the clean file
486 parentfiledata: (mode, size, mtime) of the clean file
487
487
488 parentfiledata should be computed from memory (for mode,
488 parentfiledata should be computed from memory (for mode,
489 size), as or close as possible from the point where we
489 size), as or close as possible from the point where we
490 determined the file was clean, to limit the risk of the
490 determined the file was clean, to limit the risk of the
491 file having been changed by an external process between the
491 file having been changed by an external process between the
492 moment where the file was determined to be clean and now."""
492 moment where the file was determined to be clean and now."""
493 if parentfiledata:
493 if parentfiledata:
494 (mode, size, mtime) = parentfiledata
494 (mode, size, mtime) = parentfiledata
495 else:
495 else:
496 s = os.lstat(self._join(f))
496 s = os.lstat(self._join(f))
497 mode = s.st_mode
497 mode = s.st_mode
498 size = s.st_size
498 size = s.st_size
499 mtime = s[stat.ST_MTIME]
499 mtime = s[stat.ST_MTIME]
500 self._addpath(f, b'n', mode, size, mtime)
500 self._addpath(f, b'n', mode, size, mtime)
501 self._map.copymap.pop(f, None)
501 self._map.copymap.pop(f, None)
502 if f in self._map.nonnormalset:
502 if f in self._map.nonnormalset:
503 self._map.nonnormalset.remove(f)
503 self._map.nonnormalset.remove(f)
504 if mtime > self._lastnormaltime:
504 if mtime > self._lastnormaltime:
505 # Remember the most recent modification timeslot for status(),
505 # Remember the most recent modification timeslot for status(),
506 # to make sure we won't miss future size-preserving file content
506 # to make sure we won't miss future size-preserving file content
507 # modifications that happen within the same timeslot.
507 # modifications that happen within the same timeslot.
508 self._lastnormaltime = mtime
508 self._lastnormaltime = mtime
509
509
510 def normallookup(self, f):
510 def normallookup(self, f):
511 '''Mark a file normal, but possibly dirty.'''
511 '''Mark a file normal, but possibly dirty.'''
512 if self.in_merge:
512 if self.in_merge:
513 # if there is a merge going on and the file was either
513 # if there is a merge going on and the file was either
514 # "merged" or coming from other parent (-2) before
514 # "merged" or coming from other parent (-2) before
515 # being removed, restore that state.
515 # being removed, restore that state.
516 entry = self._map.get(f)
516 entry = self._map.get(f)
517 if entry is not None:
517 if entry is not None:
518 # XXX this should probably be dealt with a a lower level
518 # XXX this should probably be dealt with a a lower level
519 # (see `merged_removed` and `from_p2_removed`)
519 # (see `merged_removed` and `from_p2_removed`)
520 if entry.merged_removed or entry.from_p2_removed:
520 if entry.merged_removed or entry.from_p2_removed:
521 source = self._map.copymap.get(f)
521 source = self._map.copymap.get(f)
522 if entry.merged_removed:
522 if entry.merged_removed:
523 self.merge(f)
523 self.merge(f)
524 elif entry.from_p2_removed:
524 elif entry.from_p2_removed:
525 self.otherparent(f)
525 self.otherparent(f)
526 if source is not None:
526 if source is not None:
527 self.copy(source, f)
527 self.copy(source, f)
528 return
528 return
529 elif entry.merged or entry.from_p2:
529 elif entry.merged or entry.from_p2:
530 return
530 return
531 self._addpath(f, b'n', 0, possibly_dirty=True)
531 self._addpath(f, b'n', 0, possibly_dirty=True)
532 self._map.copymap.pop(f, None)
532 self._map.copymap.pop(f, None)
533
533
534 def otherparent(self, f):
534 def otherparent(self, f):
535 '''Mark as coming from the other parent, always dirty.'''
535 '''Mark as coming from the other parent, always dirty.'''
536 if not self.in_merge:
536 if not self.in_merge:
537 msg = _(b"setting %r to other parent only allowed in merges") % f
537 msg = _(b"setting %r to other parent only allowed in merges") % f
538 raise error.Abort(msg)
538 raise error.Abort(msg)
539 if f in self and self[f] == b'n':
539 if f in self and self[f] == b'n':
540 # merge-like
540 # merge-like
541 self._addpath(f, b'm', 0, from_p2=True)
541 self._addpath(f, b'm', 0, from_p2=True)
542 else:
542 else:
543 # add-like
543 # add-like
544 self._addpath(f, b'n', 0, from_p2=True)
544 self._addpath(f, b'n', 0, from_p2=True)
545 self._map.copymap.pop(f, None)
545 self._map.copymap.pop(f, None)
546
546
547 def add(self, f):
547 def add(self, f):
548 '''Mark a file added.'''
548 '''Mark a file added.'''
549 self._addpath(f, added=True)
549 self._addpath(f, added=True)
550 self._map.copymap.pop(f, None)
550 self._map.copymap.pop(f, None)
551
551
552 def remove(self, f):
552 def remove(self, f):
553 '''Mark a file removed.'''
553 '''Mark a file removed.'''
554 self._dirty = True
554 self._dirty = True
555 self._updatedfiles.add(f)
555 self._updatedfiles.add(f)
556 self._map.removefile(f, in_merge=self.in_merge)
556 self._map.removefile(f, in_merge=self.in_merge)
557
557
558 def merge(self, f):
558 def merge(self, f):
559 '''Mark a file merged.'''
559 '''Mark a file merged.'''
560 if not self.in_merge:
560 if not self.in_merge:
561 return self.normallookup(f)
561 return self.normallookup(f)
562 return self.otherparent(f)
562 return self.otherparent(f)
563
563
564 def drop(self, f):
564 def drop(self, f):
565 '''Drop a file from the dirstate'''
565 '''Drop a file from the dirstate'''
566 oldstate = self[f]
566 oldstate = self[f]
567 if self._map.dropfile(f, oldstate):
567 if self._map.dropfile(f, oldstate):
568 self._dirty = True
568 self._dirty = True
569 self._updatedfiles.add(f)
569 self._updatedfiles.add(f)
570 self._map.copymap.pop(f, None)
570 self._map.copymap.pop(f, None)
571
571
572 def _discoverpath(self, path, normed, ignoremissing, exists, storemap):
572 def _discoverpath(self, path, normed, ignoremissing, exists, storemap):
573 if exists is None:
573 if exists is None:
574 exists = os.path.lexists(os.path.join(self._root, path))
574 exists = os.path.lexists(os.path.join(self._root, path))
575 if not exists:
575 if not exists:
576 # Maybe a path component exists
576 # Maybe a path component exists
577 if not ignoremissing and b'/' in path:
577 if not ignoremissing and b'/' in path:
578 d, f = path.rsplit(b'/', 1)
578 d, f = path.rsplit(b'/', 1)
579 d = self._normalize(d, False, ignoremissing, None)
579 d = self._normalize(d, False, ignoremissing, None)
580 folded = d + b"/" + f
580 folded = d + b"/" + f
581 else:
581 else:
582 # No path components, preserve original case
582 # No path components, preserve original case
583 folded = path
583 folded = path
584 else:
584 else:
585 # recursively normalize leading directory components
585 # recursively normalize leading directory components
586 # against dirstate
586 # against dirstate
587 if b'/' in normed:
587 if b'/' in normed:
588 d, f = normed.rsplit(b'/', 1)
588 d, f = normed.rsplit(b'/', 1)
589 d = self._normalize(d, False, ignoremissing, True)
589 d = self._normalize(d, False, ignoremissing, True)
590 r = self._root + b"/" + d
590 r = self._root + b"/" + d
591 folded = d + b"/" + util.fspath(f, r)
591 folded = d + b"/" + util.fspath(f, r)
592 else:
592 else:
593 folded = util.fspath(normed, self._root)
593 folded = util.fspath(normed, self._root)
594 storemap[normed] = folded
594 storemap[normed] = folded
595
595
596 return folded
596 return folded
597
597
598 def _normalizefile(self, path, isknown, ignoremissing=False, exists=None):
598 def _normalizefile(self, path, isknown, ignoremissing=False, exists=None):
599 normed = util.normcase(path)
599 normed = util.normcase(path)
600 folded = self._map.filefoldmap.get(normed, None)
600 folded = self._map.filefoldmap.get(normed, None)
601 if folded is None:
601 if folded is None:
602 if isknown:
602 if isknown:
603 folded = path
603 folded = path
604 else:
604 else:
605 folded = self._discoverpath(
605 folded = self._discoverpath(
606 path, normed, ignoremissing, exists, self._map.filefoldmap
606 path, normed, ignoremissing, exists, self._map.filefoldmap
607 )
607 )
608 return folded
608 return folded
609
609
610 def _normalize(self, path, isknown, ignoremissing=False, exists=None):
610 def _normalize(self, path, isknown, ignoremissing=False, exists=None):
611 normed = util.normcase(path)
611 normed = util.normcase(path)
612 folded = self._map.filefoldmap.get(normed, None)
612 folded = self._map.filefoldmap.get(normed, None)
613 if folded is None:
613 if folded is None:
614 folded = self._map.dirfoldmap.get(normed, None)
614 folded = self._map.dirfoldmap.get(normed, None)
615 if folded is None:
615 if folded is None:
616 if isknown:
616 if isknown:
617 folded = path
617 folded = path
618 else:
618 else:
619 # store discovered result in dirfoldmap so that future
619 # store discovered result in dirfoldmap so that future
620 # normalizefile calls don't start matching directories
620 # normalizefile calls don't start matching directories
621 folded = self._discoverpath(
621 folded = self._discoverpath(
622 path, normed, ignoremissing, exists, self._map.dirfoldmap
622 path, normed, ignoremissing, exists, self._map.dirfoldmap
623 )
623 )
624 return folded
624 return folded
625
625
626 def normalize(self, path, isknown=False, ignoremissing=False):
626 def normalize(self, path, isknown=False, ignoremissing=False):
627 """
627 """
628 normalize the case of a pathname when on a casefolding filesystem
628 normalize the case of a pathname when on a casefolding filesystem
629
629
630 isknown specifies whether the filename came from walking the
630 isknown specifies whether the filename came from walking the
631 disk, to avoid extra filesystem access.
631 disk, to avoid extra filesystem access.
632
632
633 If ignoremissing is True, missing path are returned
633 If ignoremissing is True, missing path are returned
634 unchanged. Otherwise, we try harder to normalize possibly
634 unchanged. Otherwise, we try harder to normalize possibly
635 existing path components.
635 existing path components.
636
636
637 The normalized case is determined based on the following precedence:
637 The normalized case is determined based on the following precedence:
638
638
639 - version of name already stored in the dirstate
639 - version of name already stored in the dirstate
640 - version of name stored on disk
640 - version of name stored on disk
641 - version provided via command arguments
641 - version provided via command arguments
642 """
642 """
643
643
644 if self._checkcase:
644 if self._checkcase:
645 return self._normalize(path, isknown, ignoremissing)
645 return self._normalize(path, isknown, ignoremissing)
646 return path
646 return path
647
647
648 def clear(self):
648 def clear(self):
649 self._map.clear()
649 self._map.clear()
650 self._lastnormaltime = 0
650 self._lastnormaltime = 0
651 self._updatedfiles.clear()
651 self._updatedfiles.clear()
652 self._dirty = True
652 self._dirty = True
653
653
654 def rebuild(self, parent, allfiles, changedfiles=None):
654 def rebuild(self, parent, allfiles, changedfiles=None):
655 if changedfiles is None:
655 if changedfiles is None:
656 # Rebuild entire dirstate
656 # Rebuild entire dirstate
657 to_lookup = allfiles
657 to_lookup = allfiles
658 to_drop = []
658 to_drop = []
659 lastnormaltime = self._lastnormaltime
659 lastnormaltime = self._lastnormaltime
660 self.clear()
660 self.clear()
661 self._lastnormaltime = lastnormaltime
661 self._lastnormaltime = lastnormaltime
662 elif len(changedfiles) < 10:
662 elif len(changedfiles) < 10:
663 # Avoid turning allfiles into a set, which can be expensive if it's
663 # Avoid turning allfiles into a set, which can be expensive if it's
664 # large.
664 # large.
665 to_lookup = []
665 to_lookup = []
666 to_drop = []
666 to_drop = []
667 for f in changedfiles:
667 for f in changedfiles:
668 if f in allfiles:
668 if f in allfiles:
669 to_lookup.append(f)
669 to_lookup.append(f)
670 else:
670 else:
671 to_drop.append(f)
671 to_drop.append(f)
672 else:
672 else:
673 changedfilesset = set(changedfiles)
673 changedfilesset = set(changedfiles)
674 to_lookup = changedfilesset & set(allfiles)
674 to_lookup = changedfilesset & set(allfiles)
675 to_drop = changedfilesset - to_lookup
675 to_drop = changedfilesset - to_lookup
676
676
677 if self._origpl is None:
677 if self._origpl is None:
678 self._origpl = self._pl
678 self._origpl = self._pl
679 self._map.setparents(parent, self._nodeconstants.nullid)
679 self._map.setparents(parent, self._nodeconstants.nullid)
680
680
681 for f in to_lookup:
681 for f in to_lookup:
682 self.normallookup(f)
682 self.normallookup(f)
683 for f in to_drop:
683 for f in to_drop:
684 self.drop(f)
684 self.drop(f)
685
685
686 self._dirty = True
686 self._dirty = True
687
687
688 def identity(self):
688 def identity(self):
689 """Return identity of dirstate itself to detect changing in storage
689 """Return identity of dirstate itself to detect changing in storage
690
690
691 If identity of previous dirstate is equal to this, writing
691 If identity of previous dirstate is equal to this, writing
692 changes based on the former dirstate out can keep consistency.
692 changes based on the former dirstate out can keep consistency.
693 """
693 """
694 return self._map.identity
694 return self._map.identity
695
695
696 def write(self, tr):
696 def write(self, tr):
697 if not self._dirty:
697 if not self._dirty:
698 return
698 return
699
699
700 filename = self._filename
700 filename = self._filename
701 if tr:
701 if tr:
702 # 'dirstate.write()' is not only for writing in-memory
702 # 'dirstate.write()' is not only for writing in-memory
703 # changes out, but also for dropping ambiguous timestamp.
703 # changes out, but also for dropping ambiguous timestamp.
704 # delayed writing re-raise "ambiguous timestamp issue".
704 # delayed writing re-raise "ambiguous timestamp issue".
705 # See also the wiki page below for detail:
705 # See also the wiki page below for detail:
706 # https://www.mercurial-scm.org/wiki/DirstateTransactionPlan
706 # https://www.mercurial-scm.org/wiki/DirstateTransactionPlan
707
707
708 # emulate dropping timestamp in 'parsers.pack_dirstate'
708 # emulate dropping timestamp in 'parsers.pack_dirstate'
709 now = _getfsnow(self._opener)
709 now = _getfsnow(self._opener)
710 self._map.clearambiguoustimes(self._updatedfiles, now)
710 self._map.clearambiguoustimes(self._updatedfiles, now)
711
711
712 # emulate that all 'dirstate.normal' results are written out
712 # emulate that all 'dirstate.normal' results are written out
713 self._lastnormaltime = 0
713 self._lastnormaltime = 0
714 self._updatedfiles.clear()
714 self._updatedfiles.clear()
715
715
716 # delay writing in-memory changes out
716 # delay writing in-memory changes out
717 tr.addfilegenerator(
717 tr.addfilegenerator(
718 b'dirstate',
718 b'dirstate',
719 (self._filename,),
719 (self._filename,),
720 self._writedirstate,
720 self._writedirstate,
721 location=b'plain',
721 location=b'plain',
722 )
722 )
723 return
723 return
724
724
725 st = self._opener(filename, b"w", atomictemp=True, checkambig=True)
725 st = self._opener(filename, b"w", atomictemp=True, checkambig=True)
726 self._writedirstate(st)
726 self._writedirstate(st)
727
727
728 def addparentchangecallback(self, category, callback):
728 def addparentchangecallback(self, category, callback):
729 """add a callback to be called when the wd parents are changed
729 """add a callback to be called when the wd parents are changed
730
730
731 Callback will be called with the following arguments:
731 Callback will be called with the following arguments:
732 dirstate, (oldp1, oldp2), (newp1, newp2)
732 dirstate, (oldp1, oldp2), (newp1, newp2)
733
733
734 Category is a unique identifier to allow overwriting an old callback
734 Category is a unique identifier to allow overwriting an old callback
735 with a newer callback.
735 with a newer callback.
736 """
736 """
737 self._plchangecallbacks[category] = callback
737 self._plchangecallbacks[category] = callback
738
738
739 def _writedirstate(self, st):
739 def _writedirstate(self, st):
740 # notify callbacks about parents change
740 # notify callbacks about parents change
741 if self._origpl is not None and self._origpl != self._pl:
741 if self._origpl is not None and self._origpl != self._pl:
742 for c, callback in sorted(
742 for c, callback in sorted(
743 pycompat.iteritems(self._plchangecallbacks)
743 pycompat.iteritems(self._plchangecallbacks)
744 ):
744 ):
745 callback(self, self._origpl, self._pl)
745 callback(self, self._origpl, self._pl)
746 self._origpl = None
746 self._origpl = None
747 # use the modification time of the newly created temporary file as the
747 # use the modification time of the newly created temporary file as the
748 # filesystem's notion of 'now'
748 # filesystem's notion of 'now'
749 now = util.fstat(st)[stat.ST_MTIME] & _rangemask
749 now = util.fstat(st)[stat.ST_MTIME] & _rangemask
750
750
751 # enough 'delaywrite' prevents 'pack_dirstate' from dropping
751 # enough 'delaywrite' prevents 'pack_dirstate' from dropping
752 # timestamp of each entries in dirstate, because of 'now > mtime'
752 # timestamp of each entries in dirstate, because of 'now > mtime'
753 delaywrite = self._ui.configint(b'debug', b'dirstate.delaywrite')
753 delaywrite = self._ui.configint(b'debug', b'dirstate.delaywrite')
754 if delaywrite > 0:
754 if delaywrite > 0:
755 # do we have any files to delay for?
755 # do we have any files to delay for?
756 for f, e in pycompat.iteritems(self._map):
756 for f, e in pycompat.iteritems(self._map):
757 if e.state == b'n' and e[3] == now:
757 if e.state == b'n' and e[3] == now:
758 import time # to avoid useless import
758 import time # to avoid useless import
759
759
760 # rather than sleep n seconds, sleep until the next
760 # rather than sleep n seconds, sleep until the next
761 # multiple of n seconds
761 # multiple of n seconds
762 clock = time.time()
762 clock = time.time()
763 start = int(clock) - (int(clock) % delaywrite)
763 start = int(clock) - (int(clock) % delaywrite)
764 end = start + delaywrite
764 end = start + delaywrite
765 time.sleep(end - clock)
765 time.sleep(end - clock)
766 now = end # trust our estimate that the end is near now
766 now = end # trust our estimate that the end is near now
767 break
767 break
768
768
769 self._map.write(st, now)
769 self._map.write(st, now)
770 self._lastnormaltime = 0
770 self._lastnormaltime = 0
771 self._dirty = False
771 self._dirty = False
772
772
773 def _dirignore(self, f):
773 def _dirignore(self, f):
774 if self._ignore(f):
774 if self._ignore(f):
775 return True
775 return True
776 for p in pathutil.finddirs(f):
776 for p in pathutil.finddirs(f):
777 if self._ignore(p):
777 if self._ignore(p):
778 return True
778 return True
779 return False
779 return False
780
780
781 def _ignorefiles(self):
781 def _ignorefiles(self):
782 files = []
782 files = []
783 if os.path.exists(self._join(b'.hgignore')):
783 if os.path.exists(self._join(b'.hgignore')):
784 files.append(self._join(b'.hgignore'))
784 files.append(self._join(b'.hgignore'))
785 for name, path in self._ui.configitems(b"ui"):
785 for name, path in self._ui.configitems(b"ui"):
786 if name == b'ignore' or name.startswith(b'ignore.'):
786 if name == b'ignore' or name.startswith(b'ignore.'):
787 # we need to use os.path.join here rather than self._join
787 # we need to use os.path.join here rather than self._join
788 # because path is arbitrary and user-specified
788 # because path is arbitrary and user-specified
789 files.append(os.path.join(self._rootdir, util.expandpath(path)))
789 files.append(os.path.join(self._rootdir, util.expandpath(path)))
790 return files
790 return files
791
791
792 def _ignorefileandline(self, f):
792 def _ignorefileandline(self, f):
793 files = collections.deque(self._ignorefiles())
793 files = collections.deque(self._ignorefiles())
794 visited = set()
794 visited = set()
795 while files:
795 while files:
796 i = files.popleft()
796 i = files.popleft()
797 patterns = matchmod.readpatternfile(
797 patterns = matchmod.readpatternfile(
798 i, self._ui.warn, sourceinfo=True
798 i, self._ui.warn, sourceinfo=True
799 )
799 )
800 for pattern, lineno, line in patterns:
800 for pattern, lineno, line in patterns:
801 kind, p = matchmod._patsplit(pattern, b'glob')
801 kind, p = matchmod._patsplit(pattern, b'glob')
802 if kind == b"subinclude":
802 if kind == b"subinclude":
803 if p not in visited:
803 if p not in visited:
804 files.append(p)
804 files.append(p)
805 continue
805 continue
806 m = matchmod.match(
806 m = matchmod.match(
807 self._root, b'', [], [pattern], warn=self._ui.warn
807 self._root, b'', [], [pattern], warn=self._ui.warn
808 )
808 )
809 if m(f):
809 if m(f):
810 return (i, lineno, line)
810 return (i, lineno, line)
811 visited.add(i)
811 visited.add(i)
812 return (None, -1, b"")
812 return (None, -1, b"")
813
813
814 def _walkexplicit(self, match, subrepos):
814 def _walkexplicit(self, match, subrepos):
815 """Get stat data about the files explicitly specified by match.
815 """Get stat data about the files explicitly specified by match.
816
816
817 Return a triple (results, dirsfound, dirsnotfound).
817 Return a triple (results, dirsfound, dirsnotfound).
818 - results is a mapping from filename to stat result. It also contains
818 - results is a mapping from filename to stat result. It also contains
819 listings mapping subrepos and .hg to None.
819 listings mapping subrepos and .hg to None.
820 - dirsfound is a list of files found to be directories.
820 - dirsfound is a list of files found to be directories.
821 - dirsnotfound is a list of files that the dirstate thinks are
821 - dirsnotfound is a list of files that the dirstate thinks are
822 directories and that were not found."""
822 directories and that were not found."""
823
823
824 def badtype(mode):
824 def badtype(mode):
825 kind = _(b'unknown')
825 kind = _(b'unknown')
826 if stat.S_ISCHR(mode):
826 if stat.S_ISCHR(mode):
827 kind = _(b'character device')
827 kind = _(b'character device')
828 elif stat.S_ISBLK(mode):
828 elif stat.S_ISBLK(mode):
829 kind = _(b'block device')
829 kind = _(b'block device')
830 elif stat.S_ISFIFO(mode):
830 elif stat.S_ISFIFO(mode):
831 kind = _(b'fifo')
831 kind = _(b'fifo')
832 elif stat.S_ISSOCK(mode):
832 elif stat.S_ISSOCK(mode):
833 kind = _(b'socket')
833 kind = _(b'socket')
834 elif stat.S_ISDIR(mode):
834 elif stat.S_ISDIR(mode):
835 kind = _(b'directory')
835 kind = _(b'directory')
836 return _(b'unsupported file type (type is %s)') % kind
836 return _(b'unsupported file type (type is %s)') % kind
837
837
838 badfn = match.bad
838 badfn = match.bad
839 dmap = self._map
839 dmap = self._map
840 lstat = os.lstat
840 lstat = os.lstat
841 getkind = stat.S_IFMT
841 getkind = stat.S_IFMT
842 dirkind = stat.S_IFDIR
842 dirkind = stat.S_IFDIR
843 regkind = stat.S_IFREG
843 regkind = stat.S_IFREG
844 lnkkind = stat.S_IFLNK
844 lnkkind = stat.S_IFLNK
845 join = self._join
845 join = self._join
846 dirsfound = []
846 dirsfound = []
847 foundadd = dirsfound.append
847 foundadd = dirsfound.append
848 dirsnotfound = []
848 dirsnotfound = []
849 notfoundadd = dirsnotfound.append
849 notfoundadd = dirsnotfound.append
850
850
851 if not match.isexact() and self._checkcase:
851 if not match.isexact() and self._checkcase:
852 normalize = self._normalize
852 normalize = self._normalize
853 else:
853 else:
854 normalize = None
854 normalize = None
855
855
856 files = sorted(match.files())
856 files = sorted(match.files())
857 subrepos.sort()
857 subrepos.sort()
858 i, j = 0, 0
858 i, j = 0, 0
859 while i < len(files) and j < len(subrepos):
859 while i < len(files) and j < len(subrepos):
860 subpath = subrepos[j] + b"/"
860 subpath = subrepos[j] + b"/"
861 if files[i] < subpath:
861 if files[i] < subpath:
862 i += 1
862 i += 1
863 continue
863 continue
864 while i < len(files) and files[i].startswith(subpath):
864 while i < len(files) and files[i].startswith(subpath):
865 del files[i]
865 del files[i]
866 j += 1
866 j += 1
867
867
868 if not files or b'' in files:
868 if not files or b'' in files:
869 files = [b'']
869 files = [b'']
870 # constructing the foldmap is expensive, so don't do it for the
870 # constructing the foldmap is expensive, so don't do it for the
871 # common case where files is ['']
871 # common case where files is ['']
872 normalize = None
872 normalize = None
873 results = dict.fromkeys(subrepos)
873 results = dict.fromkeys(subrepos)
874 results[b'.hg'] = None
874 results[b'.hg'] = None
875
875
876 for ff in files:
876 for ff in files:
877 if normalize:
877 if normalize:
878 nf = normalize(ff, False, True)
878 nf = normalize(ff, False, True)
879 else:
879 else:
880 nf = ff
880 nf = ff
881 if nf in results:
881 if nf in results:
882 continue
882 continue
883
883
884 try:
884 try:
885 st = lstat(join(nf))
885 st = lstat(join(nf))
886 kind = getkind(st.st_mode)
886 kind = getkind(st.st_mode)
887 if kind == dirkind:
887 if kind == dirkind:
888 if nf in dmap:
888 if nf in dmap:
889 # file replaced by dir on disk but still in dirstate
889 # file replaced by dir on disk but still in dirstate
890 results[nf] = None
890 results[nf] = None
891 foundadd((nf, ff))
891 foundadd((nf, ff))
892 elif kind == regkind or kind == lnkkind:
892 elif kind == regkind or kind == lnkkind:
893 results[nf] = st
893 results[nf] = st
894 else:
894 else:
895 badfn(ff, badtype(kind))
895 badfn(ff, badtype(kind))
896 if nf in dmap:
896 if nf in dmap:
897 results[nf] = None
897 results[nf] = None
898 except OSError as inst: # nf not found on disk - it is dirstate only
898 except OSError as inst: # nf not found on disk - it is dirstate only
899 if nf in dmap: # does it exactly match a missing file?
899 if nf in dmap: # does it exactly match a missing file?
900 results[nf] = None
900 results[nf] = None
901 else: # does it match a missing directory?
901 else: # does it match a missing directory?
902 if self._map.hasdir(nf):
902 if self._map.hasdir(nf):
903 notfoundadd(nf)
903 notfoundadd(nf)
904 else:
904 else:
905 badfn(ff, encoding.strtolocal(inst.strerror))
905 badfn(ff, encoding.strtolocal(inst.strerror))
906
906
907 # match.files() may contain explicitly-specified paths that shouldn't
907 # match.files() may contain explicitly-specified paths that shouldn't
908 # be taken; drop them from the list of files found. dirsfound/notfound
908 # be taken; drop them from the list of files found. dirsfound/notfound
909 # aren't filtered here because they will be tested later.
909 # aren't filtered here because they will be tested later.
910 if match.anypats():
910 if match.anypats():
911 for f in list(results):
911 for f in list(results):
912 if f == b'.hg' or f in subrepos:
912 if f == b'.hg' or f in subrepos:
913 # keep sentinel to disable further out-of-repo walks
913 # keep sentinel to disable further out-of-repo walks
914 continue
914 continue
915 if not match(f):
915 if not match(f):
916 del results[f]
916 del results[f]
917
917
918 # Case insensitive filesystems cannot rely on lstat() failing to detect
918 # Case insensitive filesystems cannot rely on lstat() failing to detect
919 # a case-only rename. Prune the stat object for any file that does not
919 # a case-only rename. Prune the stat object for any file that does not
920 # match the case in the filesystem, if there are multiple files that
920 # match the case in the filesystem, if there are multiple files that
921 # normalize to the same path.
921 # normalize to the same path.
922 if match.isexact() and self._checkcase:
922 if match.isexact() and self._checkcase:
923 normed = {}
923 normed = {}
924
924
925 for f, st in pycompat.iteritems(results):
925 for f, st in pycompat.iteritems(results):
926 if st is None:
926 if st is None:
927 continue
927 continue
928
928
929 nc = util.normcase(f)
929 nc = util.normcase(f)
930 paths = normed.get(nc)
930 paths = normed.get(nc)
931
931
932 if paths is None:
932 if paths is None:
933 paths = set()
933 paths = set()
934 normed[nc] = paths
934 normed[nc] = paths
935
935
936 paths.add(f)
936 paths.add(f)
937
937
938 for norm, paths in pycompat.iteritems(normed):
938 for norm, paths in pycompat.iteritems(normed):
939 if len(paths) > 1:
939 if len(paths) > 1:
940 for path in paths:
940 for path in paths:
941 folded = self._discoverpath(
941 folded = self._discoverpath(
942 path, norm, True, None, self._map.dirfoldmap
942 path, norm, True, None, self._map.dirfoldmap
943 )
943 )
944 if path != folded:
944 if path != folded:
945 results[path] = None
945 results[path] = None
946
946
947 return results, dirsfound, dirsnotfound
947 return results, dirsfound, dirsnotfound
948
948
949 def walk(self, match, subrepos, unknown, ignored, full=True):
949 def walk(self, match, subrepos, unknown, ignored, full=True):
950 """
950 """
951 Walk recursively through the directory tree, finding all files
951 Walk recursively through the directory tree, finding all files
952 matched by match.
952 matched by match.
953
953
954 If full is False, maybe skip some known-clean files.
954 If full is False, maybe skip some known-clean files.
955
955
956 Return a dict mapping filename to stat-like object (either
956 Return a dict mapping filename to stat-like object (either
957 mercurial.osutil.stat instance or return value of os.stat()).
957 mercurial.osutil.stat instance or return value of os.stat()).
958
958
959 """
959 """
960 # full is a flag that extensions that hook into walk can use -- this
960 # full is a flag that extensions that hook into walk can use -- this
961 # implementation doesn't use it at all. This satisfies the contract
961 # implementation doesn't use it at all. This satisfies the contract
962 # because we only guarantee a "maybe".
962 # because we only guarantee a "maybe".
963
963
964 if ignored:
964 if ignored:
965 ignore = util.never
965 ignore = util.never
966 dirignore = util.never
966 dirignore = util.never
967 elif unknown:
967 elif unknown:
968 ignore = self._ignore
968 ignore = self._ignore
969 dirignore = self._dirignore
969 dirignore = self._dirignore
970 else:
970 else:
971 # if not unknown and not ignored, drop dir recursion and step 2
971 # if not unknown and not ignored, drop dir recursion and step 2
972 ignore = util.always
972 ignore = util.always
973 dirignore = util.always
973 dirignore = util.always
974
974
975 matchfn = match.matchfn
975 matchfn = match.matchfn
976 matchalways = match.always()
976 matchalways = match.always()
977 matchtdir = match.traversedir
977 matchtdir = match.traversedir
978 dmap = self._map
978 dmap = self._map
979 listdir = util.listdir
979 listdir = util.listdir
980 lstat = os.lstat
980 lstat = os.lstat
981 dirkind = stat.S_IFDIR
981 dirkind = stat.S_IFDIR
982 regkind = stat.S_IFREG
982 regkind = stat.S_IFREG
983 lnkkind = stat.S_IFLNK
983 lnkkind = stat.S_IFLNK
984 join = self._join
984 join = self._join
985
985
986 exact = skipstep3 = False
986 exact = skipstep3 = False
987 if match.isexact(): # match.exact
987 if match.isexact(): # match.exact
988 exact = True
988 exact = True
989 dirignore = util.always # skip step 2
989 dirignore = util.always # skip step 2
990 elif match.prefix(): # match.match, no patterns
990 elif match.prefix(): # match.match, no patterns
991 skipstep3 = True
991 skipstep3 = True
992
992
993 if not exact and self._checkcase:
993 if not exact and self._checkcase:
994 normalize = self._normalize
994 normalize = self._normalize
995 normalizefile = self._normalizefile
995 normalizefile = self._normalizefile
996 skipstep3 = False
996 skipstep3 = False
997 else:
997 else:
998 normalize = self._normalize
998 normalize = self._normalize
999 normalizefile = None
999 normalizefile = None
1000
1000
1001 # step 1: find all explicit files
1001 # step 1: find all explicit files
1002 results, work, dirsnotfound = self._walkexplicit(match, subrepos)
1002 results, work, dirsnotfound = self._walkexplicit(match, subrepos)
1003 if matchtdir:
1003 if matchtdir:
1004 for d in work:
1004 for d in work:
1005 matchtdir(d[0])
1005 matchtdir(d[0])
1006 for d in dirsnotfound:
1006 for d in dirsnotfound:
1007 matchtdir(d)
1007 matchtdir(d)
1008
1008
1009 skipstep3 = skipstep3 and not (work or dirsnotfound)
1009 skipstep3 = skipstep3 and not (work or dirsnotfound)
1010 work = [d for d in work if not dirignore(d[0])]
1010 work = [d for d in work if not dirignore(d[0])]
1011
1011
1012 # step 2: visit subdirectories
1012 # step 2: visit subdirectories
1013 def traverse(work, alreadynormed):
1013 def traverse(work, alreadynormed):
1014 wadd = work.append
1014 wadd = work.append
1015 while work:
1015 while work:
1016 tracing.counter('dirstate.walk work', len(work))
1016 tracing.counter('dirstate.walk work', len(work))
1017 nd = work.pop()
1017 nd = work.pop()
1018 visitentries = match.visitchildrenset(nd)
1018 visitentries = match.visitchildrenset(nd)
1019 if not visitentries:
1019 if not visitentries:
1020 continue
1020 continue
1021 if visitentries == b'this' or visitentries == b'all':
1021 if visitentries == b'this' or visitentries == b'all':
1022 visitentries = None
1022 visitentries = None
1023 skip = None
1023 skip = None
1024 if nd != b'':
1024 if nd != b'':
1025 skip = b'.hg'
1025 skip = b'.hg'
1026 try:
1026 try:
1027 with tracing.log('dirstate.walk.traverse listdir %s', nd):
1027 with tracing.log('dirstate.walk.traverse listdir %s', nd):
1028 entries = listdir(join(nd), stat=True, skip=skip)
1028 entries = listdir(join(nd), stat=True, skip=skip)
1029 except OSError as inst:
1029 except OSError as inst:
1030 if inst.errno in (errno.EACCES, errno.ENOENT):
1030 if inst.errno in (errno.EACCES, errno.ENOENT):
1031 match.bad(
1031 match.bad(
1032 self.pathto(nd), encoding.strtolocal(inst.strerror)
1032 self.pathto(nd), encoding.strtolocal(inst.strerror)
1033 )
1033 )
1034 continue
1034 continue
1035 raise
1035 raise
1036 for f, kind, st in entries:
1036 for f, kind, st in entries:
1037 # Some matchers may return files in the visitentries set,
1037 # Some matchers may return files in the visitentries set,
1038 # instead of 'this', if the matcher explicitly mentions them
1038 # instead of 'this', if the matcher explicitly mentions them
1039 # and is not an exactmatcher. This is acceptable; we do not
1039 # and is not an exactmatcher. This is acceptable; we do not
1040 # make any hard assumptions about file-or-directory below
1040 # make any hard assumptions about file-or-directory below
1041 # based on the presence of `f` in visitentries. If
1041 # based on the presence of `f` in visitentries. If
1042 # visitchildrenset returned a set, we can always skip the
1042 # visitchildrenset returned a set, we can always skip the
1043 # entries *not* in the set it provided regardless of whether
1043 # entries *not* in the set it provided regardless of whether
1044 # they're actually a file or a directory.
1044 # they're actually a file or a directory.
1045 if visitentries and f not in visitentries:
1045 if visitentries and f not in visitentries:
1046 continue
1046 continue
1047 if normalizefile:
1047 if normalizefile:
1048 # even though f might be a directory, we're only
1048 # even though f might be a directory, we're only
1049 # interested in comparing it to files currently in the
1049 # interested in comparing it to files currently in the
1050 # dmap -- therefore normalizefile is enough
1050 # dmap -- therefore normalizefile is enough
1051 nf = normalizefile(
1051 nf = normalizefile(
1052 nd and (nd + b"/" + f) or f, True, True
1052 nd and (nd + b"/" + f) or f, True, True
1053 )
1053 )
1054 else:
1054 else:
1055 nf = nd and (nd + b"/" + f) or f
1055 nf = nd and (nd + b"/" + f) or f
1056 if nf not in results:
1056 if nf not in results:
1057 if kind == dirkind:
1057 if kind == dirkind:
1058 if not ignore(nf):
1058 if not ignore(nf):
1059 if matchtdir:
1059 if matchtdir:
1060 matchtdir(nf)
1060 matchtdir(nf)
1061 wadd(nf)
1061 wadd(nf)
1062 if nf in dmap and (matchalways or matchfn(nf)):
1062 if nf in dmap and (matchalways or matchfn(nf)):
1063 results[nf] = None
1063 results[nf] = None
1064 elif kind == regkind or kind == lnkkind:
1064 elif kind == regkind or kind == lnkkind:
1065 if nf in dmap:
1065 if nf in dmap:
1066 if matchalways or matchfn(nf):
1066 if matchalways or matchfn(nf):
1067 results[nf] = st
1067 results[nf] = st
1068 elif (matchalways or matchfn(nf)) and not ignore(
1068 elif (matchalways or matchfn(nf)) and not ignore(
1069 nf
1069 nf
1070 ):
1070 ):
1071 # unknown file -- normalize if necessary
1071 # unknown file -- normalize if necessary
1072 if not alreadynormed:
1072 if not alreadynormed:
1073 nf = normalize(nf, False, True)
1073 nf = normalize(nf, False, True)
1074 results[nf] = st
1074 results[nf] = st
1075 elif nf in dmap and (matchalways or matchfn(nf)):
1075 elif nf in dmap and (matchalways or matchfn(nf)):
1076 results[nf] = None
1076 results[nf] = None
1077
1077
1078 for nd, d in work:
1078 for nd, d in work:
1079 # alreadynormed means that processwork doesn't have to do any
1079 # alreadynormed means that processwork doesn't have to do any
1080 # expensive directory normalization
1080 # expensive directory normalization
1081 alreadynormed = not normalize or nd == d
1081 alreadynormed = not normalize or nd == d
1082 traverse([d], alreadynormed)
1082 traverse([d], alreadynormed)
1083
1083
1084 for s in subrepos:
1084 for s in subrepos:
1085 del results[s]
1085 del results[s]
1086 del results[b'.hg']
1086 del results[b'.hg']
1087
1087
1088 # step 3: visit remaining files from dmap
1088 # step 3: visit remaining files from dmap
1089 if not skipstep3 and not exact:
1089 if not skipstep3 and not exact:
1090 # If a dmap file is not in results yet, it was either
1090 # If a dmap file is not in results yet, it was either
1091 # a) not matching matchfn b) ignored, c) missing, or d) under a
1091 # a) not matching matchfn b) ignored, c) missing, or d) under a
1092 # symlink directory.
1092 # symlink directory.
1093 if not results and matchalways:
1093 if not results and matchalways:
1094 visit = [f for f in dmap]
1094 visit = [f for f in dmap]
1095 else:
1095 else:
1096 visit = [f for f in dmap if f not in results and matchfn(f)]
1096 visit = [f for f in dmap if f not in results and matchfn(f)]
1097 visit.sort()
1097 visit.sort()
1098
1098
1099 if unknown:
1099 if unknown:
1100 # unknown == True means we walked all dirs under the roots
1100 # unknown == True means we walked all dirs under the roots
1101 # that wasn't ignored, and everything that matched was stat'ed
1101 # that wasn't ignored, and everything that matched was stat'ed
1102 # and is already in results.
1102 # and is already in results.
1103 # The rest must thus be ignored or under a symlink.
1103 # The rest must thus be ignored or under a symlink.
1104 audit_path = pathutil.pathauditor(self._root, cached=True)
1104 audit_path = pathutil.pathauditor(self._root, cached=True)
1105
1105
1106 for nf in iter(visit):
1106 for nf in iter(visit):
1107 # If a stat for the same file was already added with a
1107 # If a stat for the same file was already added with a
1108 # different case, don't add one for this, since that would
1108 # different case, don't add one for this, since that would
1109 # make it appear as if the file exists under both names
1109 # make it appear as if the file exists under both names
1110 # on disk.
1110 # on disk.
1111 if (
1111 if (
1112 normalizefile
1112 normalizefile
1113 and normalizefile(nf, True, True) in results
1113 and normalizefile(nf, True, True) in results
1114 ):
1114 ):
1115 results[nf] = None
1115 results[nf] = None
1116 # Report ignored items in the dmap as long as they are not
1116 # Report ignored items in the dmap as long as they are not
1117 # under a symlink directory.
1117 # under a symlink directory.
1118 elif audit_path.check(nf):
1118 elif audit_path.check(nf):
1119 try:
1119 try:
1120 results[nf] = lstat(join(nf))
1120 results[nf] = lstat(join(nf))
1121 # file was just ignored, no links, and exists
1121 # file was just ignored, no links, and exists
1122 except OSError:
1122 except OSError:
1123 # file doesn't exist
1123 # file doesn't exist
1124 results[nf] = None
1124 results[nf] = None
1125 else:
1125 else:
1126 # It's either missing or under a symlink directory
1126 # It's either missing or under a symlink directory
1127 # which we in this case report as missing
1127 # which we in this case report as missing
1128 results[nf] = None
1128 results[nf] = None
1129 else:
1129 else:
1130 # We may not have walked the full directory tree above,
1130 # We may not have walked the full directory tree above,
1131 # so stat and check everything we missed.
1131 # so stat and check everything we missed.
1132 iv = iter(visit)
1132 iv = iter(visit)
1133 for st in util.statfiles([join(i) for i in visit]):
1133 for st in util.statfiles([join(i) for i in visit]):
1134 results[next(iv)] = st
1134 results[next(iv)] = st
1135 return results
1135 return results
1136
1136
1137 def _rust_status(self, matcher, list_clean, list_ignored, list_unknown):
1137 def _rust_status(self, matcher, list_clean, list_ignored, list_unknown):
1138 # Force Rayon (Rust parallelism library) to respect the number of
1138 # Force Rayon (Rust parallelism library) to respect the number of
1139 # workers. This is a temporary workaround until Rust code knows
1139 # workers. This is a temporary workaround until Rust code knows
1140 # how to read the config file.
1140 # how to read the config file.
1141 numcpus = self._ui.configint(b"worker", b"numcpus")
1141 numcpus = self._ui.configint(b"worker", b"numcpus")
1142 if numcpus is not None:
1142 if numcpus is not None:
1143 encoding.environ.setdefault(b'RAYON_NUM_THREADS', b'%d' % numcpus)
1143 encoding.environ.setdefault(b'RAYON_NUM_THREADS', b'%d' % numcpus)
1144
1144
1145 workers_enabled = self._ui.configbool(b"worker", b"enabled", True)
1145 workers_enabled = self._ui.configbool(b"worker", b"enabled", True)
1146 if not workers_enabled:
1146 if not workers_enabled:
1147 encoding.environ[b"RAYON_NUM_THREADS"] = b"1"
1147 encoding.environ[b"RAYON_NUM_THREADS"] = b"1"
1148
1148
1149 (
1149 (
1150 lookup,
1150 lookup,
1151 modified,
1151 modified,
1152 added,
1152 added,
1153 removed,
1153 removed,
1154 deleted,
1154 deleted,
1155 clean,
1155 clean,
1156 ignored,
1156 ignored,
1157 unknown,
1157 unknown,
1158 warnings,
1158 warnings,
1159 bad,
1159 bad,
1160 traversed,
1160 traversed,
1161 dirty,
1161 dirty,
1162 ) = rustmod.status(
1162 ) = rustmod.status(
1163 self._map._rustmap,
1163 self._map._rustmap,
1164 matcher,
1164 matcher,
1165 self._rootdir,
1165 self._rootdir,
1166 self._ignorefiles(),
1166 self._ignorefiles(),
1167 self._checkexec,
1167 self._checkexec,
1168 self._lastnormaltime,
1168 self._lastnormaltime,
1169 bool(list_clean),
1169 bool(list_clean),
1170 bool(list_ignored),
1170 bool(list_ignored),
1171 bool(list_unknown),
1171 bool(list_unknown),
1172 bool(matcher.traversedir),
1172 bool(matcher.traversedir),
1173 )
1173 )
1174
1174
1175 self._dirty |= dirty
1175 self._dirty |= dirty
1176
1176
1177 if matcher.traversedir:
1177 if matcher.traversedir:
1178 for dir in traversed:
1178 for dir in traversed:
1179 matcher.traversedir(dir)
1179 matcher.traversedir(dir)
1180
1180
1181 if self._ui.warn:
1181 if self._ui.warn:
1182 for item in warnings:
1182 for item in warnings:
1183 if isinstance(item, tuple):
1183 if isinstance(item, tuple):
1184 file_path, syntax = item
1184 file_path, syntax = item
1185 msg = _(b"%s: ignoring invalid syntax '%s'\n") % (
1185 msg = _(b"%s: ignoring invalid syntax '%s'\n") % (
1186 file_path,
1186 file_path,
1187 syntax,
1187 syntax,
1188 )
1188 )
1189 self._ui.warn(msg)
1189 self._ui.warn(msg)
1190 else:
1190 else:
1191 msg = _(b"skipping unreadable pattern file '%s': %s\n")
1191 msg = _(b"skipping unreadable pattern file '%s': %s\n")
1192 self._ui.warn(
1192 self._ui.warn(
1193 msg
1193 msg
1194 % (
1194 % (
1195 pathutil.canonpath(
1195 pathutil.canonpath(
1196 self._rootdir, self._rootdir, item
1196 self._rootdir, self._rootdir, item
1197 ),
1197 ),
1198 b"No such file or directory",
1198 b"No such file or directory",
1199 )
1199 )
1200 )
1200 )
1201
1201
1202 for (fn, message) in bad:
1202 for (fn, message) in bad:
1203 matcher.bad(fn, encoding.strtolocal(message))
1203 matcher.bad(fn, encoding.strtolocal(message))
1204
1204
1205 status = scmutil.status(
1205 status = scmutil.status(
1206 modified=modified,
1206 modified=modified,
1207 added=added,
1207 added=added,
1208 removed=removed,
1208 removed=removed,
1209 deleted=deleted,
1209 deleted=deleted,
1210 unknown=unknown,
1210 unknown=unknown,
1211 ignored=ignored,
1211 ignored=ignored,
1212 clean=clean,
1212 clean=clean,
1213 )
1213 )
1214 return (lookup, status)
1214 return (lookup, status)
1215
1215
1216 def status(self, match, subrepos, ignored, clean, unknown):
1216 def status(self, match, subrepos, ignored, clean, unknown):
1217 """Determine the status of the working copy relative to the
1217 """Determine the status of the working copy relative to the
1218 dirstate and return a pair of (unsure, status), where status is of type
1218 dirstate and return a pair of (unsure, status), where status is of type
1219 scmutil.status and:
1219 scmutil.status and:
1220
1220
1221 unsure:
1221 unsure:
1222 files that might have been modified since the dirstate was
1222 files that might have been modified since the dirstate was
1223 written, but need to be read to be sure (size is the same
1223 written, but need to be read to be sure (size is the same
1224 but mtime differs)
1224 but mtime differs)
1225 status.modified:
1225 status.modified:
1226 files that have definitely been modified since the dirstate
1226 files that have definitely been modified since the dirstate
1227 was written (different size or mode)
1227 was written (different size or mode)
1228 status.clean:
1228 status.clean:
1229 files that have definitely not been modified since the
1229 files that have definitely not been modified since the
1230 dirstate was written
1230 dirstate was written
1231 """
1231 """
1232 listignored, listclean, listunknown = ignored, clean, unknown
1232 listignored, listclean, listunknown = ignored, clean, unknown
1233 lookup, modified, added, unknown, ignored = [], [], [], [], []
1233 lookup, modified, added, unknown, ignored = [], [], [], [], []
1234 removed, deleted, clean = [], [], []
1234 removed, deleted, clean = [], [], []
1235
1235
1236 dmap = self._map
1236 dmap = self._map
1237 dmap.preload()
1237 dmap.preload()
1238
1238
1239 use_rust = True
1239 use_rust = True
1240
1240
1241 allowed_matchers = (
1241 allowed_matchers = (
1242 matchmod.alwaysmatcher,
1242 matchmod.alwaysmatcher,
1243 matchmod.exactmatcher,
1243 matchmod.exactmatcher,
1244 matchmod.includematcher,
1244 matchmod.includematcher,
1245 )
1245 )
1246
1246
1247 if rustmod is None:
1247 if rustmod is None:
1248 use_rust = False
1248 use_rust = False
1249 elif self._checkcase:
1249 elif self._checkcase:
1250 # Case-insensitive filesystems are not handled yet
1250 # Case-insensitive filesystems are not handled yet
1251 use_rust = False
1251 use_rust = False
1252 elif subrepos:
1252 elif subrepos:
1253 use_rust = False
1253 use_rust = False
1254 elif sparse.enabled:
1254 elif sparse.enabled:
1255 use_rust = False
1255 use_rust = False
1256 elif not isinstance(match, allowed_matchers):
1256 elif not isinstance(match, allowed_matchers):
1257 # Some matchers have yet to be implemented
1257 # Some matchers have yet to be implemented
1258 use_rust = False
1258 use_rust = False
1259
1259
1260 if use_rust:
1260 if use_rust:
1261 try:
1261 try:
1262 return self._rust_status(
1262 return self._rust_status(
1263 match, listclean, listignored, listunknown
1263 match, listclean, listignored, listunknown
1264 )
1264 )
1265 except rustmod.FallbackError:
1265 except rustmod.FallbackError:
1266 pass
1266 pass
1267
1267
1268 def noop(f):
1268 def noop(f):
1269 pass
1269 pass
1270
1270
1271 dcontains = dmap.__contains__
1271 dcontains = dmap.__contains__
1272 dget = dmap.__getitem__
1272 dget = dmap.__getitem__
1273 ladd = lookup.append # aka "unsure"
1273 ladd = lookup.append # aka "unsure"
1274 madd = modified.append
1274 madd = modified.append
1275 aadd = added.append
1275 aadd = added.append
1276 uadd = unknown.append if listunknown else noop
1276 uadd = unknown.append if listunknown else noop
1277 iadd = ignored.append if listignored else noop
1277 iadd = ignored.append if listignored else noop
1278 radd = removed.append
1278 radd = removed.append
1279 dadd = deleted.append
1279 dadd = deleted.append
1280 cadd = clean.append if listclean else noop
1280 cadd = clean.append if listclean else noop
1281 mexact = match.exact
1281 mexact = match.exact
1282 dirignore = self._dirignore
1282 dirignore = self._dirignore
1283 checkexec = self._checkexec
1283 checkexec = self._checkexec
1284 copymap = self._map.copymap
1284 copymap = self._map.copymap
1285 lastnormaltime = self._lastnormaltime
1285 lastnormaltime = self._lastnormaltime
1286
1286
1287 # We need to do full walks when either
1287 # We need to do full walks when either
1288 # - we're listing all clean files, or
1288 # - we're listing all clean files, or
1289 # - match.traversedir does something, because match.traversedir should
1289 # - match.traversedir does something, because match.traversedir should
1290 # be called for every dir in the working dir
1290 # be called for every dir in the working dir
1291 full = listclean or match.traversedir is not None
1291 full = listclean or match.traversedir is not None
1292 for fn, st in pycompat.iteritems(
1292 for fn, st in pycompat.iteritems(
1293 self.walk(match, subrepos, listunknown, listignored, full=full)
1293 self.walk(match, subrepos, listunknown, listignored, full=full)
1294 ):
1294 ):
1295 if not dcontains(fn):
1295 if not dcontains(fn):
1296 if (listignored or mexact(fn)) and dirignore(fn):
1296 if (listignored or mexact(fn)) and dirignore(fn):
1297 if listignored:
1297 if listignored:
1298 iadd(fn)
1298 iadd(fn)
1299 else:
1299 else:
1300 uadd(fn)
1300 uadd(fn)
1301 continue
1301 continue
1302
1302
1303 # This is equivalent to 'state, mode, size, time = dmap[fn]' but not
1303 # This is equivalent to 'state, mode, size, time = dmap[fn]' but not
1304 # written like that for performance reasons. dmap[fn] is not a
1304 # written like that for performance reasons. dmap[fn] is not a
1305 # Python tuple in compiled builds. The CPython UNPACK_SEQUENCE
1305 # Python tuple in compiled builds. The CPython UNPACK_SEQUENCE
1306 # opcode has fast paths when the value to be unpacked is a tuple or
1306 # opcode has fast paths when the value to be unpacked is a tuple or
1307 # a list, but falls back to creating a full-fledged iterator in
1307 # a list, but falls back to creating a full-fledged iterator in
1308 # general. That is much slower than simply accessing and storing the
1308 # general. That is much slower than simply accessing and storing the
1309 # tuple members one by one.
1309 # tuple members one by one.
1310 t = dget(fn)
1310 t = dget(fn)
1311 state = t.state
1311 state = t.state
1312 mode = t[1]
1312 mode = t[1]
1313 size = t[2]
1313 size = t[2]
1314 time = t[3]
1314 time = t[3]
1315
1315
1316 if not st and state in b"nma":
1316 if not st and state in b"nma":
1317 dadd(fn)
1317 dadd(fn)
1318 elif state == b'n':
1318 elif state == b'n':
1319 if (
1319 if (
1320 size >= 0
1320 size >= 0
1321 and (
1321 and (
1322 (size != st.st_size and size != st.st_size & _rangemask)
1322 (size != st.st_size and size != st.st_size & _rangemask)
1323 or ((mode ^ st.st_mode) & 0o100 and checkexec)
1323 or ((mode ^ st.st_mode) & 0o100 and checkexec)
1324 )
1324 )
1325 or t.from_p2
1325 or t.from_p2
1326 or fn in copymap
1326 or fn in copymap
1327 ):
1327 ):
1328 if stat.S_ISLNK(st.st_mode) and size != st.st_size:
1328 if stat.S_ISLNK(st.st_mode) and size != st.st_size:
1329 # issue6456: Size returned may be longer due to
1329 # issue6456: Size returned may be longer due to
1330 # encryption on EXT-4 fscrypt, undecided.
1330 # encryption on EXT-4 fscrypt, undecided.
1331 ladd(fn)
1331 ladd(fn)
1332 else:
1332 else:
1333 madd(fn)
1333 madd(fn)
1334 elif (
1334 elif (
1335 time != st[stat.ST_MTIME]
1335 time != st[stat.ST_MTIME]
1336 and time != st[stat.ST_MTIME] & _rangemask
1336 and time != st[stat.ST_MTIME] & _rangemask
1337 ):
1337 ):
1338 ladd(fn)
1338 ladd(fn)
1339 elif st[stat.ST_MTIME] == lastnormaltime:
1339 elif st[stat.ST_MTIME] == lastnormaltime:
1340 # fn may have just been marked as normal and it may have
1340 # fn may have just been marked as normal and it may have
1341 # changed in the same second without changing its size.
1341 # changed in the same second without changing its size.
1342 # This can happen if we quickly do multiple commits.
1342 # This can happen if we quickly do multiple commits.
1343 # Force lookup, so we don't miss such a racy file change.
1343 # Force lookup, so we don't miss such a racy file change.
1344 ladd(fn)
1344 ladd(fn)
1345 elif listclean:
1345 elif listclean:
1346 cadd(fn)
1346 cadd(fn)
1347 elif t.merged:
1347 elif t.merged:
1348 madd(fn)
1348 madd(fn)
1349 elif state == b'a':
1349 elif t.added:
1350 aadd(fn)
1350 aadd(fn)
1351 elif t.removed:
1351 elif t.removed:
1352 radd(fn)
1352 radd(fn)
1353 status = scmutil.status(
1353 status = scmutil.status(
1354 modified, added, removed, deleted, unknown, ignored, clean
1354 modified, added, removed, deleted, unknown, ignored, clean
1355 )
1355 )
1356 return (lookup, status)
1356 return (lookup, status)
1357
1357
1358 def matches(self, match):
1358 def matches(self, match):
1359 """
1359 """
1360 return files in the dirstate (in whatever state) filtered by match
1360 return files in the dirstate (in whatever state) filtered by match
1361 """
1361 """
1362 dmap = self._map
1362 dmap = self._map
1363 if rustmod is not None:
1363 if rustmod is not None:
1364 dmap = self._map._rustmap
1364 dmap = self._map._rustmap
1365
1365
1366 if match.always():
1366 if match.always():
1367 return dmap.keys()
1367 return dmap.keys()
1368 files = match.files()
1368 files = match.files()
1369 if match.isexact():
1369 if match.isexact():
1370 # fast path -- filter the other way around, since typically files is
1370 # fast path -- filter the other way around, since typically files is
1371 # much smaller than dmap
1371 # much smaller than dmap
1372 return [f for f in files if f in dmap]
1372 return [f for f in files if f in dmap]
1373 if match.prefix() and all(fn in dmap for fn in files):
1373 if match.prefix() and all(fn in dmap for fn in files):
1374 # fast path -- all the values are known to be files, so just return
1374 # fast path -- all the values are known to be files, so just return
1375 # that
1375 # that
1376 return list(files)
1376 return list(files)
1377 return [f for f in dmap if match(f)]
1377 return [f for f in dmap if match(f)]
1378
1378
1379 def _actualfilename(self, tr):
1379 def _actualfilename(self, tr):
1380 if tr:
1380 if tr:
1381 return self._pendingfilename
1381 return self._pendingfilename
1382 else:
1382 else:
1383 return self._filename
1383 return self._filename
1384
1384
1385 def savebackup(self, tr, backupname):
1385 def savebackup(self, tr, backupname):
1386 '''Save current dirstate into backup file'''
1386 '''Save current dirstate into backup file'''
1387 filename = self._actualfilename(tr)
1387 filename = self._actualfilename(tr)
1388 assert backupname != filename
1388 assert backupname != filename
1389
1389
1390 # use '_writedirstate' instead of 'write' to write changes certainly,
1390 # use '_writedirstate' instead of 'write' to write changes certainly,
1391 # because the latter omits writing out if transaction is running.
1391 # because the latter omits writing out if transaction is running.
1392 # output file will be used to create backup of dirstate at this point.
1392 # output file will be used to create backup of dirstate at this point.
1393 if self._dirty or not self._opener.exists(filename):
1393 if self._dirty or not self._opener.exists(filename):
1394 self._writedirstate(
1394 self._writedirstate(
1395 self._opener(filename, b"w", atomictemp=True, checkambig=True)
1395 self._opener(filename, b"w", atomictemp=True, checkambig=True)
1396 )
1396 )
1397
1397
1398 if tr:
1398 if tr:
1399 # ensure that subsequent tr.writepending returns True for
1399 # ensure that subsequent tr.writepending returns True for
1400 # changes written out above, even if dirstate is never
1400 # changes written out above, even if dirstate is never
1401 # changed after this
1401 # changed after this
1402 tr.addfilegenerator(
1402 tr.addfilegenerator(
1403 b'dirstate',
1403 b'dirstate',
1404 (self._filename,),
1404 (self._filename,),
1405 self._writedirstate,
1405 self._writedirstate,
1406 location=b'plain',
1406 location=b'plain',
1407 )
1407 )
1408
1408
1409 # ensure that pending file written above is unlinked at
1409 # ensure that pending file written above is unlinked at
1410 # failure, even if tr.writepending isn't invoked until the
1410 # failure, even if tr.writepending isn't invoked until the
1411 # end of this transaction
1411 # end of this transaction
1412 tr.registertmp(filename, location=b'plain')
1412 tr.registertmp(filename, location=b'plain')
1413
1413
1414 self._opener.tryunlink(backupname)
1414 self._opener.tryunlink(backupname)
1415 # hardlink backup is okay because _writedirstate is always called
1415 # hardlink backup is okay because _writedirstate is always called
1416 # with an "atomictemp=True" file.
1416 # with an "atomictemp=True" file.
1417 util.copyfile(
1417 util.copyfile(
1418 self._opener.join(filename),
1418 self._opener.join(filename),
1419 self._opener.join(backupname),
1419 self._opener.join(backupname),
1420 hardlink=True,
1420 hardlink=True,
1421 )
1421 )
1422
1422
1423 def restorebackup(self, tr, backupname):
1423 def restorebackup(self, tr, backupname):
1424 '''Restore dirstate by backup file'''
1424 '''Restore dirstate by backup file'''
1425 # this "invalidate()" prevents "wlock.release()" from writing
1425 # this "invalidate()" prevents "wlock.release()" from writing
1426 # changes of dirstate out after restoring from backup file
1426 # changes of dirstate out after restoring from backup file
1427 self.invalidate()
1427 self.invalidate()
1428 filename = self._actualfilename(tr)
1428 filename = self._actualfilename(tr)
1429 o = self._opener
1429 o = self._opener
1430 if util.samefile(o.join(backupname), o.join(filename)):
1430 if util.samefile(o.join(backupname), o.join(filename)):
1431 o.unlink(backupname)
1431 o.unlink(backupname)
1432 else:
1432 else:
1433 o.rename(backupname, filename, checkambig=True)
1433 o.rename(backupname, filename, checkambig=True)
1434
1434
1435 def clearbackup(self, tr, backupname):
1435 def clearbackup(self, tr, backupname):
1436 '''Clear backup file'''
1436 '''Clear backup file'''
1437 self._opener.unlink(backupname)
1437 self._opener.unlink(backupname)
@@ -1,542 +1,547 b''
1 # parsers.py - Python implementation of parsers.c
1 # parsers.py - Python implementation of parsers.c
2 #
2 #
3 # Copyright 2009 Olivia Mackall <olivia@selenic.com> and others
3 # Copyright 2009 Olivia Mackall <olivia@selenic.com> and others
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import struct
10 import struct
11 import zlib
11 import zlib
12
12
13 from ..node import (
13 from ..node import (
14 nullrev,
14 nullrev,
15 sha1nodeconstants,
15 sha1nodeconstants,
16 )
16 )
17 from .. import (
17 from .. import (
18 error,
18 error,
19 pycompat,
19 pycompat,
20 revlogutils,
20 revlogutils,
21 util,
21 util,
22 )
22 )
23
23
24 from ..revlogutils import nodemap as nodemaputil
24 from ..revlogutils import nodemap as nodemaputil
25 from ..revlogutils import constants as revlog_constants
25 from ..revlogutils import constants as revlog_constants
26
26
# in-memory bytes stream type used when serializing
stringio = pycompat.bytesio


# module-level shortcuts for the struct and zlib entry points
_pack, _unpack = struct.pack, struct.unpack
_compress, _decompress = zlib.compress, zlib.decompress


# a special value used internally for `size` if the file comes from the other
# parent
FROM_P2 = -2

# a special value used internally for `size` if the file is
# modified/merged/added
NONNORMAL = -1
41
41
42
42
class dirstatetuple(object):
    """represent a dirstate entry

    It contains:

    - state (one of 'n', 'a', 'r', 'm')
    - mode,
    - size,
    - mtime,

    An entry can also be indexed like the 4-tuple
    ``(state, mode, size, mtime)``: indexes 0..3 and -4..-1 are accepted,
    anything else raises IndexError.
    """

    # The attribute Python honors is `__slots__` (plural); the previous
    # `__slot__` spelling was a plain class attribute with no effect, so
    # every entry still carried a per-instance `__dict__`.
    __slots__ = ('_state', '_mode', '_size', '_mtime')

    def __init__(self, state, mode, size, mtime):
        self._state = state
        self._mode = mode
        self._size = size
        self._mtime = mtime

    def __getitem__(self, idx):
        if idx == 0 or idx == -4:
            return self._state
        elif idx == 1 or idx == -3:
            return self._mode
        elif idx == 2 or idx == -2:
            return self._size
        elif idx == 3 or idx == -1:
            return self._mtime
        else:
            raise IndexError(idx)

    @property
    def state(self):
        """
        States are:
          n  normal
          m  needs merging
          r  marked for removal
          a  marked for addition

        XXX This "state" is a bit obscure and mostly a direct expression of the
        dirstatev1 format. It would make sense to ultimately deprecate it in
        favor of the more "semantic" attributes.
        """
        return self._state

    @property
    def added(self):
        """True if the file has been added"""
        return self._state == b'a'

    @property
    def merged(self):
        """True if the file has been merged

        Should only be set if a merge is in progress in the dirstate
        """
        return self._state == b'm'

    @property
    def from_p2(self):
        """True if the file has been fetched from p2 during the current merge

        This is only True if the file is currently tracked.

        Should only be set if a merge is in progress in the dirstate
        """
        return self._state == b'n' and self._size == FROM_P2

    @property
    def from_p2_removed(self):
        """True if the file has been removed, but was "from_p2" initially

        This property seems like an abstraction leakage and should probably be
        dealt in this class (or maybe the dirstatemap) directly.
        """
        return self._state == b'r' and self._size == FROM_P2

    @property
    def removed(self):
        """True if the file has been removed"""
        return self._state == b'r'

    @property
    def merged_removed(self):
        """True if the file has been removed, but was "merged" initially

        This property seems like an abstraction leakage and should probably be
        dealt in this class (or maybe the dirstatemap) directly.
        """
        return self._state == b'r' and self._size == NONNORMAL

    def v1_state(self):
        """return a "state" suitable for v1 serialization"""
        return self._state

    def v1_mode(self):
        """return a "mode" suitable for v1 serialization"""
        return self._mode

    def v1_size(self):
        """return a "size" suitable for v1 serialization"""
        return self._size

    def v1_mtime(self):
        """return a "mtime" suitable for v1 serialization"""
        return self._mtime
145
150
146
151
def gettype(q):
    """return the low 16 bits of ``q`` as an int"""
    low_bits = q & 0xFFFF
    return int(low_bits)
149
154
150
155
class BaseIndexObject(object):
    """behavior shared by the pure-Python index classes

    The methods below read ``self._data``, ``self._lgt`` and ``self._extra``
    and call ``self._calculate_index()``. None of these is defined here;
    they are provided by the subclasses.
    """

    # Can I be passed to an algorithm implemented in Rust ?
    rust_ext_compat = 0
    # Format of an index entry according to Python's `struct` language
    index_format = revlog_constants.INDEX_ENTRY_V1
    # Size of the `>Q` struct format (standard size, platform independent)
    big_int_size = struct.calcsize(b'>Q')
    # Size of the `>i` struct format (standard size, platform independent)
    int_size = struct.calcsize(b'>i')
    # An empty index entry, used as a default value to be overridden, or
    # returned for nullrev (index -1)
    null_item = (
        0,
        0,
        0,
        -1,
        -1,
        -1,
        -1,
        sha1nodeconstants.nullid,
        0,
        0,
        revlog_constants.COMP_MODE_INLINE,
        revlog_constants.COMP_MODE_INLINE,
    )

    @util.propertycache
    def entry_size(self):
        """size of one packed index entry, taken from `index_format`"""
        return self.index_format.size

    @property
    def nodemap(self):
        """deprecated accessor for the node -> rev mapping"""
        msg = b"index.nodemap is deprecated, use index.[has_node|rev|get_rev]"
        util.nouideprecwarn(msg, b'5.3', stacklevel=2)
        return self._nodemap

    @util.propertycache
    def _nodemap(self):
        """node -> rev mapping built from every entry of the index"""
        mapping = nodemaputil.NodeMap({sha1nodeconstants.nullid: nullrev})
        for revnum in range(len(self)):
            # item 7 of an entry is its node
            node = self[revnum][7]
            mapping[node] = revnum
        return mapping

    def has_node(self, node):
        """return True if the node exist in the index"""
        return node in self._nodemap

    def rev(self, node):
        """return a revision for a node

        If the node is unknown, the nodemap lookup raises (documented
        upstream as a RevlogError)"""
        return self._nodemap[node]

    def get_rev(self, node):
        """return a revision for a node

        If the node is unknown, return None"""
        return self._nodemap.get(node)

    def _stripnodes(self, start):
        """forget the nodes of revisions `start` and above

        Nothing is done when the nodemap has not been computed yet."""
        if '_nodemap' not in vars(self):
            return
        for revnum in range(start, len(self)):
            node = self[revnum][7]
            del self._nodemap[node]

    def clearcaches(self):
        """drop the cached nodemap, if any"""
        self.__dict__.pop('_nodemap', None)

    def __len__(self):
        return self._lgt + len(self._extra)

    def append(self, tup):
        """add the entry `tup` at the end of the index"""
        revnum = len(self)
        # only keep the nodemap in sync when it has already been computed
        if '_nodemap' in vars(self):
            self._nodemap[tup[7]] = revnum
        packed = self._pack_entry(revnum, tup)
        self._extra.append(packed)

    def _pack_entry(self, rev, entry):
        """return the binary form of `entry` (its first 8 items)"""
        # items 8 and 9 are not part of this format and must be zero
        assert entry[8] == 0
        assert entry[9] == 0
        return self.index_format.pack(*entry[:8])

    def _check_index(self, i):
        """raise unless `i` is an int within [0, len(self))"""
        if not isinstance(i, int):
            raise TypeError(b"expecting int indexes")
        if not 0 <= i < len(self):
            raise IndexError

    def __getitem__(self, i):
        if i == -1:
            return self.null_item
        self._check_index(i)
        if i < self._lgt:
            # entry stored in the initial data
            begin = self._calculate_index(i)
            raw = self._data[begin : begin + self.entry_size]
        else:
            # entry appended after the initial data
            raw = self._extra[i - self._lgt]
        entry = self._unpack_entry(i, raw)
        if self._lgt and i == 0:
            # for the first entry, only the type bits of item 0 are kept and
            # the offset part is forced to 0
            first = revlogutils.offset_type(0, gettype(entry[0]))
            entry = (first,) + entry[1:]
        return entry

    def _unpack_entry(self, rev, data):
        """decode `data` and pad it with the items this format lacks"""
        unpacked = self.index_format.unpack(data)
        padding = (
            0,
            0,
            revlog_constants.COMP_MODE_INLINE,
            revlog_constants.COMP_MODE_INLINE,
        )
        return unpacked + padding

    def pack_header(self, header):
        """pack header information as binary"""
        return revlog_constants.INDEX_HEADER.pack(header)

    def entry_binary(self, rev):
        """return the raw binary string representing a revision"""
        packed = revlog_constants.INDEX_ENTRY_V1.pack(*self[rev][:8])
        if rev == 0:
            # the leading INDEX_HEADER.size bytes are dropped for revision 0
            packed = packed[revlog_constants.INDEX_HEADER.size :]
        return packed
276
281
277
282
class IndexObject(BaseIndexObject):
    """index over `data` made of fixed-size entries stored back to back"""

    def __init__(self, data):
        total = len(data)
        count, leftover = divmod(total, self.entry_size)
        assert leftover == 0, (
            total,
            self.entry_size,
            leftover,
        )
        self._data = data
        self._lgt = count
        self._extra = []

    def _calculate_index(self, i):
        """offset in `_data` of entry `i`"""
        return self.entry_size * i

    def __delitem__(self, i):
        """truncate the index; only ``del index[a:-1]`` is supported"""
        supported = isinstance(i, slice) and i.stop == -1 and i.step is None
        if not supported:
            raise ValueError(b"deleting slices only supports a:-1 with step 1")
        first = i.start
        self._check_index(first)
        self._stripnodes(first)
        if first >= self._lgt:
            # only appended entries are affected
            self._extra = self._extra[: first - self._lgt]
            return
        # the cut is inside the initial data: shorten it and drop every
        # appended entry
        self._data = self._data[: first * self.entry_size]
        self._lgt = first
        self._extra = []
304
309
305
310
class PersistentNodeMapIndexObject(IndexObject):
    """a debug oriented class to test persistent nodemap

    We need a simple python object to test API and higher level behavior. See
    the Rust implementation for more serious usage. This should be used only
    through the dedicated `devel.persistent-nodemap` config.
    """

    def nodemap_data_all(self):
        """Return bytes containing a full serialization of a nodemap

        The nodemap should be valid for the full set of revisions in the
        index."""
        return nodemaputil.persistent_data(self)

    def nodemap_data_incremental(self):
        """Return bytes containing an incremental update to persistent nodemap

        This contains the data for an append-only update of the data provided
        in the last call to `update_nodemap_data`.

        Returns None when no nodemap root is currently recorded, otherwise
        a `(docket, changed, data)` tuple. The recorded state is cleared
        before returning.
        """
        if self._nm_root is None:
            return None
        previous_docket = self._nm_docket
        changed, data = nodemaputil.update_persistent_data(
            self,
            self._nm_root,
            self._nm_max_idx,
            self._nm_docket.tip_rev,
        )

        self._nm_root = self._nm_max_idx = self._nm_docket = None
        return previous_docket, changed, data

    def update_nodemap_data(self, docket, nm_data):
        """provide full block of persisted binary data for a nodemap

        The data are expected to come from disk. See `nodemap_data_all` for a
        producer of such data."""
        if nm_data is not None:
            root, max_idx = nodemaputil.parse_data(nm_data)
            self._nm_root, self._nm_max_idx = root, max_idx
            if self._nm_root:
                self._nm_docket = docket
            else:
                # a falsy root: record nothing at all
                self._nm_root = self._nm_max_idx = self._nm_docket = None
348
353
349
354
class InlinedIndexObject(BaseIndexObject):
    """index whose entries are each followed by a variable-length chunk

    The position of every entry is found by scanning `data` once.
    """

    def __init__(self, data, inline=0):
        self._data = data
        # first pass counts the entries, second pass records their offsets
        self._lgt = self._inline_scan(None)
        self._inline_scan(self._lgt)
        self._extra = []

    def _inline_scan(self, lgt):
        """walk the data and return the number of entries found

        When `lgt` is not None, `self._offsets` is (re)created with `lgt`
        slots and filled with the offset of each entry.
        Raise ValueError if the walk does not end exactly at the end of
        the data.
        """
        record = lgt is not None
        pos = 0
        if record:
            self._offsets = [0] * lgt
        found = 0
        while pos <= len(self._data) - self.entry_size:
            # the chunk length is the `>i` field that follows the leading
            # `>Q` field of the entry
            field = pos + self.big_int_size
            (chunk_len,) = struct.unpack(
                b'>i',
                self._data[field : field + self.int_size],
            )
            if record:
                self._offsets[found] = pos
            found += 1
            pos += self.entry_size + chunk_len
        if pos != len(self._data):
            raise ValueError(b"corrupted data")
        return found

    def __delitem__(self, i):
        """truncate the index; only ``del index[a:-1]`` is supported"""
        supported = isinstance(i, slice) and i.stop == -1 and i.step is None
        if not supported:
            raise ValueError(b"deleting slices only supports a:-1 with step 1")
        first = i.start
        self._check_index(first)
        self._stripnodes(first)
        if first >= self._lgt:
            # only appended entries are affected
            self._extra = self._extra[: first - self._lgt]
            return
        # the cut is inside the scanned data: forget the trailing offsets
        # and drop every appended entry
        self._offsets = self._offsets[:first]
        self._lgt = first
        self._extra = []

    def _calculate_index(self, i):
        """offset in `_data` of entry `i`, as recorded by the scan"""
        return self._offsets[i]
391
396
392
397
def parse_index2(data, inline, revlogv2=False):
    """return an `(index, cache)` pair for `data`

    Inline data gives an InlinedIndexObject and a `(0, data)` cache;
    otherwise an IndexObject (IndexObject2 when `revlogv2` is set) and None.
    """
    if inline:
        return InlinedIndexObject(data, inline), (0, data)
    if revlogv2:
        return IndexObject2(data), None
    return IndexObject(data), None
399
404
400
405
def parse_index_cl_v2(data):
    """return an `(IndexChangelogV2, None)` pair for `data`"""
    index = IndexChangelogV2(data)
    return index, None
403
408
404
409
class IndexObject2(IndexObject):
    """index using the INDEX_ENTRY_V2 entry format

    Entries carry sidedata offset/length (items 8 and 9) and two
    compression modes (items 10 and 11) stored together in one packed field.
    """

    index_format = revlog_constants.INDEX_ENTRY_V2

    def replace_sidedata_info(
        self,
        rev,
        sidedata_offset,
        sidedata_length,
        offset_flags,
        compression_mode,
    ):
        """
        Replace an existing index entry's sidedata offset and length with new
        ones.
        This cannot be used outside of the context of sidedata rewriting,
        inside the transaction that creates the revision `rev`.
        """
        if rev < 0:
            raise KeyError
        self._check_index(rev)
        if rev < self._lgt:
            # only entries appended to this object may be rewritten
            msg = b"cannot rewrite entries outside of this transaction"
            raise KeyError(msg)
        fields = list(self[rev])
        fields[0] = offset_flags
        fields[8] = sidedata_offset
        fields[9] = sidedata_length
        fields[11] = compression_mode
        repacked = self._pack_entry(rev, tuple(fields))
        self._extra[rev - self._lgt] = repacked

    def _unpack_entry(self, rev, data):
        """decode `data` into a 12 items entry"""
        unpacked = self.index_format.unpack(data)
        modes = unpacked[10]
        # bits 0-1: data compression mode, bits 2-3: sidedata compression mode
        data_comp = modes & 3
        sidedata_comp = (modes >> 2) & 3
        return unpacked[:10] + (data_comp, sidedata_comp)

    def _pack_entry(self, rev, entry):
        """encode a 12 items entry, merging both compression modes"""
        fields = entry[:10]
        modes = (entry[10] & 3) | ((entry[11] & 3) << 2)
        fields += (modes,)

        return self.index_format.pack(*fields)

    def entry_binary(self, rev):
        """return the raw binary string representing a revision"""
        return self._pack_entry(rev, self[rev])

    def pack_header(self, header):
        """pack header information as binary

        Always raises ProgrammingError for this class."""
        msg = 'version header should go in the docket, not the index: %d'
        msg %= header
        raise error.ProgrammingError(msg)
463
468
464
469
class IndexChangelogV2(IndexObject2):
    """index using the INDEX_ENTRY_CL_V2 entry format

    Items 3 and 4 of an entry are not stored: they are always the revision
    number itself.
    """

    index_format = revlog_constants.INDEX_ENTRY_CL_V2

    def _unpack_entry(self, rev, data, r=True):
        """decode `data` into a 12 items entry, re-inserting `rev` twice"""
        stored = self.index_format.unpack(data)
        modes = stored[8]
        head = stored[:3] + (rev, rev) + stored[3:8]
        # bits 0-1: data compression mode, bits 2-3: sidedata compression mode
        return head + (modes & 3, (modes >> 2) & 3)

    def _pack_entry(self, rev, entry):
        """encode a 12 items entry, leaving out items 3 and 4"""
        assert entry[3] == rev, entry[3]
        assert entry[4] == rev, entry[4]
        fields = entry[:3] + entry[5:10]
        modes = (entry[10] & 3) | ((entry[11] & 3) << 2)
        fields += (modes,)
        return self.index_format.pack(*fields)
483
488
484
489
def parse_index_devel_nodemap(data, inline):
    """like parse_index2, but always return a PersistentNodeMapIndexObject

    `inline` is accepted but not used."""
    index = PersistentNodeMapIndexObject(data)
    return index, None
488
493
489
494
def parse_dirstate(dmap, copymap, st):
    """fill `dmap` and `copymap` from the serialized dirstate `st`

    `st` starts with two 20-byte parents, followed by records made of a
    `>cllll` header (state, mode, size, mtime, name length) and the name
    itself. A name holding a NUL byte is split into `name` and its copy
    source, which is recorded in `copymap`.

    Returns the two parents as a list.
    """
    parents = [st[:20], st[20:40]]
    header_size = struct.calcsize(b">cllll")
    total = len(st)
    cursor = 40

    while cursor < total:
        name_start = cursor + header_size
        # a literal format here is faster
        state, mode, size, mtime, name_len = _unpack(
            b">cllll", st[cursor:name_start]
        )
        cursor = name_start + name_len
        fname = st[name_start:cursor]
        if b'\0' in fname:
            fname, source = fname.split(b'\0')
            copymap[fname] = source
        dmap[fname] = dirstatetuple(state, mode, size, mtime)
    return parents
509
514
510
515
def pack_dirstate(dmap, copymap, pl, now):
    """serialize a dirstate and return it as bytes

    The output is the parents `pl` joined together, then one record per
    entry of `dmap`: a `>cllll` header followed by the file name (with a NUL
    byte and the copy source appended when the file is in `copymap`).

    Entries in state `n` whose mtime equals `now` are replaced in `dmap` by
    a copy with mtime -1 (see the comment in the loop).
    """
    now = int(now)
    out = stringio()
    out.write(b"".join(pl))
    for fname, entry in pycompat.iteritems(dmap):
        if entry[0] == b'n' and entry[3] == now:
            # The file was last modified "simultaneously" with the current
            # write to dirstate (i.e. within the same second for file-
            # systems with a granularity of 1 sec). This commonly happens
            # for at least a couple of files on 'update'.
            # The user could change the file without changing its size
            # within the same second. Invalidate the file's mtime in
            # dirstate, forcing future 'status' calls to compare the
            # contents of the file if the size is the same. This prevents
            # mistakenly treating such files as clean.
            entry = dirstatetuple(entry[0], entry[1], entry[2], -1)
            dmap[fname] = entry

        record_name = fname
        if fname in copymap:
            record_name = b"%s\0%s" % (fname, copymap[fname])
        header = _pack(
            b">cllll",
            entry.v1_state(),
            entry.v1_mode(),
            entry.v1_size(),
            entry.v1_mtime(),
            len(record_name),
        )
        out.write(header)
        out.write(record_name)
    return out.getvalue()
General Comments 0
You need to be logged in to leave comments. Login now