Show More
@@ -1,560 +1,594 b'' | |||||
1 | The *dirstate* is what Mercurial uses internally to track |
|
1 | The *dirstate* is what Mercurial uses internally to track | |
2 | the state of files in the working directory, |
|
2 | the state of files in the working directory, | |
3 | such as set by commands like `hg add` and `hg rm`. |
|
3 | such as set by commands like `hg add` and `hg rm`. | |
4 | It also contains some cached data that help make `hg status` faster. |
|
4 | It also contains some cached data that help make `hg status` faster. | |
5 | The name refers both to `.hg/dirstate` on the filesystem |
|
5 | The name refers both to `.hg/dirstate` on the filesystem | |
6 | and the corresponding data structure in memory while a Mercurial process |
|
6 | and the corresponding data structure in memory while a Mercurial process | |
7 | is running. |
|
7 | is running. | |
8 |
|
8 | |||
9 | The original file format, retroactively dubbed `dirstate-v1`, |
|
9 | The original file format, retroactively dubbed `dirstate-v1`, | |
10 | is described at https://www.mercurial-scm.org/wiki/DirState. |
|
10 | is described at https://www.mercurial-scm.org/wiki/DirState. | |
11 | It is made of a flat sequence of unordered variable-size entries, |
|
11 | It is made of a flat sequence of unordered variable-size entries, | |
12 | so accessing any information in it requires parsing all of it. |
|
12 | so accessing any information in it requires parsing all of it. | |
13 | Similarly, saving changes requires rewriting the entire file. |
|
13 | Similarly, saving changes requires rewriting the entire file. | |
14 |
|
14 | |||
15 | The newer `dirstate-v2` file format is designed to fix these limitations 

15 | The newer `dirstate-v2` file format is designed to fix these limitations | |
16 | and make `hg status` faster. |
|
16 | and make `hg status` faster. | |
17 |
|
17 | |||
18 | User guide |
|
18 | User guide | |
19 | ========== |
|
19 | ========== | |
20 |
|
20 | |||
21 | Compatibility |
|
21 | Compatibility | |
22 | ------------- |
|
22 | ------------- | |
23 |
|
23 | |||
24 | The file format is experimental and may still change. |
|
24 | The file format is experimental and may still change. | |
25 | Different versions of Mercurial may not be compatible with each other |
|
25 | Different versions of Mercurial may not be compatible with each other | |
26 | when working on a local repository that uses this format. |
|
26 | when working on a local repository that uses this format. | |
27 | When using an incompatible version with the experimental format, |
|
27 | When using an incompatible version with the experimental format, | |
28 | anything can happen including data corruption. |
|
28 | anything can happen including data corruption. | |
29 |
|
29 | |||
30 | Since the dirstate is entirely local and not relevant to the wire protocol, |
|
30 | Since the dirstate is entirely local and not relevant to the wire protocol, | |
31 | `dirstate-v2` does not affect compatibility with remote Mercurial versions. |
|
31 | `dirstate-v2` does not affect compatibility with remote Mercurial versions. | |
32 |
|
32 | |||
33 | When `share-safe` is enabled, different repositories sharing the same store |
|
33 | When `share-safe` is enabled, different repositories sharing the same store | |
34 | can use different dirstate formats. |
|
34 | can use different dirstate formats. | |
35 |
|
35 | |||
36 | Enabling `dirstate-v2` for new local repositories 

36 | Enabling `dirstate-v2` for new local repositories | |
37 | ------------------------------------------------- 

37 | ------------------------------------------------- | |
38 |
|
38 | |||
39 | When creating a new local repository such as with `hg init` or `hg clone`, |
|
39 | When creating a new local repository such as with `hg init` or `hg clone`, | |
40 | the `exp-dirstate-v2` boolean in the `format` configuration section |
|
40 | the `exp-dirstate-v2` boolean in the `format` configuration section | |
41 | controls whether to use this file format. |
|
41 | controls whether to use this file format. | |
42 | This is disabled by default as of this writing. |
|
42 | This is disabled by default as of this writing. | |
43 | To enable it for a single repository, run for example:: |
|
43 | To enable it for a single repository, run for example:: | |
44 |
|
44 | |||
45 | $ hg init my-project --config format.exp-dirstate-v2=1 |
|
45 | $ hg init my-project --config format.exp-dirstate-v2=1 | |
46 |
|
46 | |||
47 | Checking the format of an existing local repository 

47 | Checking the format of an existing local repository | |
48 | --------------------------------------------------- 

48 | --------------------------------------------------- | |
49 |
|
49 | |||
50 | The `debugformat` command prints information about 

50 | The `debugformat` command prints information about | |
51 | which of multiple optional formats are used in the current repository, |
|
51 | which of multiple optional formats are used in the current repository, | |
52 | including `dirstate-v2`:: |
|
52 | including `dirstate-v2`:: | |
53 |
|
53 | |||
54 | $ hg debugformat |
|
54 | $ hg debugformat | |
55 | format-variant repo |
|
55 | format-variant repo | |
56 | fncache: yes |
|
56 | fncache: yes | |
57 | dirstate-v2: yes |
|
57 | dirstate-v2: yes | |
58 | […] 

58 | […] | |
59 |
|
59 | |||
60 | Upgrading or downgrading an existing local repository |
|
60 | Upgrading or downgrading an existing local repository | |
61 | ----------------------------------------------------- |
|
61 | ----------------------------------------------------- | |
62 |
|
62 | |||
63 | The `debugupgrade` command does various upgrades or downgrades |
|
63 | The `debugupgrade` command does various upgrades or downgrades | |
64 | on a local repository |
|
64 | on a local repository | |
65 | based on the current Mercurial version and on configuration. |
|
65 | based on the current Mercurial version and on configuration. | |
66 | The same `format.exp-dirstate-v2` configuration is used again. |
|
66 | The same `format.exp-dirstate-v2` configuration is used again. | |
67 |
|
67 | |||
68 | Example to upgrade:: |
|
68 | Example to upgrade:: | |
69 |
|
69 | |||
70 | $ hg debugupgrade --config format.exp-dirstate-v2=1 |
|
70 | $ hg debugupgrade --config format.exp-dirstate-v2=1 | |
71 |
|
71 | |||
72 | Example to downgrade to `dirstate-v1`:: |
|
72 | Example to downgrade to `dirstate-v1`:: | |
73 |
|
73 | |||
74 | $ hg debugupgrade --config format.exp-dirstate-v2=0 |
|
74 | $ hg debugupgrade --config format.exp-dirstate-v2=0 | |
75 |
|
75 | |||
76 | Both of these commands do nothing but print a list of proposed changes, 

76 | Both of these commands do nothing but print a list of proposed changes, | |
77 | which may include changes unrelated to the dirstate. |
|
77 | which may include changes unrelated to the dirstate. | |
78 | Those other changes are controlled by their own configuration keys. |
|
78 | Those other changes are controlled by their own configuration keys. | |
79 | Add `--run` to a command to actually apply the proposed changes. |
|
79 | Add `--run` to a command to actually apply the proposed changes. | |
80 |
|
80 | |||
81 | Backups of `.hg/requires` and `.hg/dirstate` are created |
|
81 | Backups of `.hg/requires` and `.hg/dirstate` are created | |
82 | in a `.hg/upgradebackup.*` directory. |
|
82 | in a `.hg/upgradebackup.*` directory. | |
83 | If something goes wrong, restoring those files should undo the change. |
|
83 | If something goes wrong, restoring those files should undo the change. | |
84 |
|
84 | |||
85 | Note that upgrading affects compatibility with older versions of Mercurial |
|
85 | Note that upgrading affects compatibility with older versions of Mercurial | |
86 | as noted above. |
|
86 | as noted above. | |
87 | This can be relevant when a repository’s files are on a USB drive 

87 | This can be relevant when a repository’s files are on a USB drive | |
88 | or some other removable media, or shared over the network, etc. |
|
88 | or some other removable media, or shared over the network, etc. | |
89 |
|
89 | |||
90 | Internal filesystem representation |
|
90 | Internal filesystem representation | |
91 | ================================== |
|
91 | ================================== | |
92 |
|
92 | |||
93 | Requirements file |
|
93 | Requirements file | |
94 | ----------------- |
|
94 | ----------------- | |
95 |
|
95 | |||
96 | The `.hg/requires` file indicates which of various optional file formats |
|
96 | The `.hg/requires` file indicates which of various optional file formats | |
97 | are used by a given repository. |
|
97 | are used by a given repository. | |
98 | Mercurial aborts when seeing a requirement it does not know about, |
|
98 | Mercurial aborts when seeing a requirement it does not know about, | |
99 | which avoids older versions accidentally messing up a repository 

99 | which avoids older versions accidentally messing up a repository | |
100 | that uses a format that was introduced later. |
|
100 | that uses a format that was introduced later. | |
101 | For versions that do support a format, the presence or absence of |
|
101 | For versions that do support a format, the presence or absence of | |
102 | the corresponding requirement indicates whether to use that format. |
|
102 | the corresponding requirement indicates whether to use that format. | |
103 |
|
103 | |||
104 | When the file contains an `exp-dirstate-v2` line, 

104 | When the file contains an `exp-dirstate-v2` line, | |
105 | the `dirstate-v2` format is used. |
|
105 | the `dirstate-v2` format is used. | |
106 | With no such line `dirstate-v1` is used. |
|
106 | With no such line `dirstate-v1` is used. | |
107 |
|
107 | |||
108 | High level description |
|
108 | High level description | |
109 | ---------------------- |
|
109 | ---------------------- | |
110 |
|
110 | |||
111 | Whereas `dirstate-v1` uses a single `.hg/dirstate` file, 

111 | Whereas `dirstate-v1` uses a single `.hg/dirstate` file, | |
112 | in `dirstate-v2` that file is a "docket" file |
|
112 | in `dirstate-v2` that file is a "docket" file | |
113 | that only contains some metadata |
|
113 | that only contains some metadata | |
114 | and points to a separate data file named `.hg/dirstate.{ID}`, 

114 | and points to a separate data file named `.hg/dirstate.{ID}`, | |
115 | where `{ID}` is a random identifier. |
|
115 | where `{ID}` is a random identifier. | |
116 |
|
116 | |||
117 | This separation allows making data files append-only |
|
117 | This separation allows making data files append-only | |
118 | and therefore safer to memory-map. |
|
118 | and therefore safer to memory-map. | |
119 | Creating a new data file (occasionally to clean up unused data) |
|
119 | Creating a new data file (occasionally to clean up unused data) | |
120 | can be done with a different ID |
|
120 | can be done with a different ID | |
121 | without disrupting another Mercurial process |
|
121 | without disrupting another Mercurial process | |
122 | that could still be using the previous data file. |
|
122 | that could still be using the previous data file. | |
123 |
|
123 | |||
124 | Both files have a format designed to reduce the need for parsing, |
|
124 | Both files have a format designed to reduce the need for parsing, | |
125 | by using fixed-size binary components as much as possible. |
|
125 | by using fixed-size binary components as much as possible. | |
126 | For data that is not fixed-size, |
|
126 | For data that is not fixed-size, | |
127 | references to other parts of a file can be made by storing "pseudo-pointers": |
|
127 | references to other parts of a file can be made by storing "pseudo-pointers": | |
128 | integers counted in bytes from the start of a file. |
|
128 | integers counted in bytes from the start of a file. | |
129 | For read-only access no data structure is needed, |
|
129 | For read-only access no data structure is needed, | |
130 | only a bytes buffer (possibly memory-mapped directly from the filesystem) |
|
130 | only a bytes buffer (possibly memory-mapped directly from the filesystem) | |
131 | with specific parts read on demand. |
|
131 | with specific parts read on demand. | |
132 |
|
132 | |||
133 | The data file contains "nodes" organized in a tree. |
|
133 | The data file contains "nodes" organized in a tree. | |
134 | Each node represents a file or directory inside the working directory |
|
134 | Each node represents a file or directory inside the working directory | |
135 | or its parent changeset. |
|
135 | or its parent changeset. | |
136 | This tree has the same structure as the filesystem, |
|
136 | This tree has the same structure as the filesystem, | |
137 | so a node representing a directory has child nodes representing |
|
137 | so a node representing a directory has child nodes representing | |
138 | the files and subdirectories contained directly in that directory. |
|
138 | the files and subdirectories contained directly in that directory. | |
139 |
|
139 | |||
140 | The docket file format |
|
140 | The docket file format | |
141 | ---------------------- |
|
141 | ---------------------- | |
142 |
|
142 | |||
143 | This is implemented in `rust/hg-core/src/dirstate_tree/on_disk.rs` |
|
143 | This is implemented in `rust/hg-core/src/dirstate_tree/on_disk.rs` | |
144 | and `mercurial/dirstateutils/docket.py`. |
|
144 | and `mercurial/dirstateutils/docket.py`. | |
145 |
|
145 | |||
146 | Components of the docket file are found at fixed offsets, |
|
146 | Components of the docket file are found at fixed offsets, | |
147 | counted in bytes from the start of the file: |
|
147 | counted in bytes from the start of the file: | |
148 |
|
148 | |||
149 | * Offset 0: |
|
149 | * Offset 0: | |
150 | The 12-byte marker string "dirstate-v2\n" ending with a newline character. 

150 | The 12-byte marker string "dirstate-v2\n" ending with a newline character. | |
151 | This makes it easier to tell a dirstate-v2 file from a dirstate-v1 file, |
|
151 | This makes it easier to tell a dirstate-v2 file from a dirstate-v1 file, | |
152 | although it is not strictly necessary |
|
152 | although it is not strictly necessary | |
153 | since `.hg/requires` determines which format to use. |
|
153 | since `.hg/requires` determines which format to use. | |
154 |
|
154 | |||
155 | * Offset 12: |
|
155 | * Offset 12: | |
156 | The changeset node ID on the first parent of the working directory, |
|
156 | The changeset node ID on the first parent of the working directory, | |
157 | as up to 32 binary bytes. |
|
157 | as up to 32 binary bytes. | |
158 | If a node ID is shorter (20 bytes for SHA-1), |
|
158 | If a node ID is shorter (20 bytes for SHA-1), | |
159 | it is start-aligned and the rest of the bytes are set to zero. |
|
159 | it is start-aligned and the rest of the bytes are set to zero. | |
160 |
|
160 | |||
161 | * Offset 44: |
|
161 | * Offset 44: | |
162 | The changeset node ID on the second parent of the working directory, |
|
162 | The changeset node ID on the second parent of the working directory, | |
163 | or all zeros if there isn’t one. 

163 | or all zeros if there isn’t one. | |
164 | Also 32 binary bytes. |
|
164 | Also 32 binary bytes. | |
165 |
|
165 | |||
166 | * Offset 76: |
|
166 | * Offset 76: | |
167 | Tree metadata on 44 bytes, described below. |
|
167 | Tree metadata on 44 bytes, described below. | |
168 | Its separation in this documentation from the rest of the docket |
|
168 | Its separation in this documentation from the rest of the docket | |
169 | reflects a detail of the current implementation. |
|
169 | reflects a detail of the current implementation. | |
170 | Since tree metadata is also made of fields at fixed offsets, those could |
|
170 | Since tree metadata is also made of fields at fixed offsets, those could | |
171 | be inlined here by adding 76 bytes to each offset. |
|
171 | be inlined here by adding 76 bytes to each offset. | |
172 |
|
172 | |||
173 | * Offset 120: |
|
173 | * Offset 120: | |
174 | The used size of the data file, as a 32-bit big-endian integer. |
|
174 | The used size of the data file, as a 32-bit big-endian integer. | |
175 | The actual size of the data file may be larger |
|
175 | The actual size of the data file may be larger | |
176 | (if another Mercurial process is appending to it 

176 | (if another Mercurial process is appending to it | |
177 | but has not updated the docket yet). |
|
177 | but has not updated the docket yet). | |
178 | That extra data must be ignored. |
|
178 | That extra data must be ignored. | |
179 |
|
179 | |||
180 | * Offset 124: |
|
180 | * Offset 124: | |
181 | The length of the data file identifier, as an 8-bit integer. 

181 | The length of the data file identifier, as an 8-bit integer. | |
182 |
|
182 | |||
183 | * Offset 125: |
|
183 | * Offset 125: | |
184 | The data file identifier. |
|
184 | The data file identifier. | |
185 |
|
185 | |||
186 | * Any additional data is currently ignored, and dropped when updating the file. 

186 | * Any additional data is currently ignored, and dropped when updating the file. | |
187 |
|
187 | |||
188 | Tree metadata in the docket file |
|
188 | Tree metadata in the docket file | |
189 | -------------------------------- |
|
189 | -------------------------------- | |
190 |
|
190 | |||
191 | Tree metadata is similarly made of components at fixed offsets. |
|
191 | Tree metadata is similarly made of components at fixed offsets. | |
192 | These offsets are counted in bytes from the start of tree metadata, |
|
192 | These offsets are counted in bytes from the start of tree metadata, | |
193 | which is 76 bytes after the start of the docket file. |
|
193 | which is 76 bytes after the start of the docket file. | |
194 |
|
194 | |||
195 | This metadata can be thought of as the singular root of the tree |
|
195 | This metadata can be thought of as the singular root of the tree | |
196 | formed by nodes in the data file. |
|
196 | formed by nodes in the data file. | |
197 |
|
197 | |||
198 | * Offset 0: |
|
198 | * Offset 0: | |
199 | Pseudo-pointer to the start of root nodes, |
|
199 | Pseudo-pointer to the start of root nodes, | |
200 | counted in bytes from the start of the data file, |
|
200 | counted in bytes from the start of the data file, | |
201 | as a 32-bit big-endian integer. |
|
201 | as a 32-bit big-endian integer. | |
202 | These nodes describe files and directories found directly |
|
202 | These nodes describe files and directories found directly | |
203 | at the root of the working directory. |
|
203 | at the root of the working directory. | |
204 |
|
204 | |||
205 | * Offset 4: |
|
205 | * Offset 4: | |
206 | Number of root nodes, as a 32-bit big-endian integer. |
|
206 | Number of root nodes, as a 32-bit big-endian integer. | |
207 |
|
207 | |||
208 | * Offset 8: |
|
208 | * Offset 8: | |
209 | Total number of nodes in the entire tree that "have a dirstate entry", |
|
209 | Total number of nodes in the entire tree that "have a dirstate entry", | |
210 | as a 32-bit big-endian integer. |
|
210 | as a 32-bit big-endian integer. | |
211 | Those nodes represent files that would be present at all in `dirstate-v1`. |
|
211 | Those nodes represent files that would be present at all in `dirstate-v1`. | |
212 | This is typically less than the total number of nodes. |
|
212 | This is typically less than the total number of nodes. | |
213 | This counter is used to implement `len(dirstatemap)`. |
|
213 | This counter is used to implement `len(dirstatemap)`. | |
214 |
|
214 | |||
215 | * Offset 12: |
|
215 | * Offset 12: | |
216 | Number of nodes in the entire tree that have a copy source, |
|
216 | Number of nodes in the entire tree that have a copy source, | |
217 | as a 32-bit big-endian integer. |
|
217 | as a 32-bit big-endian integer. | |
218 | At the next commit, these files are recorded |
|
218 | At the next commit, these files are recorded | |
219 | as having been copied or moved/renamed from that source. |
|
219 | as having been copied or moved/renamed from that source. | |
220 | (A move is recorded as a copy and separate removal of the source.) |
|
220 | (A move is recorded as a copy and separate removal of the source.) | |
221 | This counter is used to implement `len(dirstatemap.copymap)`. |
|
221 | This counter is used to implement `len(dirstatemap.copymap)`. | |
222 |
|
222 | |||
223 | * Offset 16: |
|
223 | * Offset 16: | |
224 | An estimation of how many bytes of the data file |
|
224 | An estimation of how many bytes of the data file | |
225 | (within its used size) are unused, as a 32-bit big-endian integer. |
|
225 | (within its used size) are unused, as a 32-bit big-endian integer. | |
226 | When appending to an existing data file, |
|
226 | When appending to an existing data file, | |
227 | some existing nodes or paths can be unreachable from the new root |
|
227 | some existing nodes or paths can be unreachable from the new root | |
228 | but they still take up space. |
|
228 | but they still take up space. | |
229 | This counter is used to decide when to write a new data file from scratch |
|
229 | This counter is used to decide when to write a new data file from scratch | |
230 | instead of appending to an existing one, |
|
230 | instead of appending to an existing one, | |
231 | in order to get rid of that unreachable data |
|
231 | in order to get rid of that unreachable data | |
232 | and avoid unbounded file size growth. |
|
232 | and avoid unbounded file size growth. | |
233 |
|
233 | |||
234 | * Offset 20: |
|
234 | * Offset 20: | |
235 | These four bytes are currently ignored |
|
235 | These four bytes are currently ignored | |
236 | and reset to zero when updating a docket file. |
|
236 | and reset to zero when updating a docket file. | |
237 | This is an attempt at forward compatibility: |
|
237 | This is an attempt at forward compatibility: | |
238 | future Mercurial versions could use this as a bit field |
|
238 | future Mercurial versions could use this as a bit field | |
239 | to indicate that a dirstate has additional data or constraints. |
|
239 | to indicate that a dirstate has additional data or constraints. | |
240 | Finding a dirstate file with the relevant bit unset indicates that |
|
240 | Finding a dirstate file with the relevant bit unset indicates that | |
241 | it was written by a then-older version |
|
241 | it was written by a then-older version | |
242 | which is not aware of that future change. |
|
242 | which is not aware of that future change. | |
243 |
|
243 | |||
244 | * Offset 24: |
|
244 | * Offset 24: | |
245 | Either 20 zero bytes, or a SHA-1 hash as 20 binary bytes. |
|
245 | Either 20 zero bytes, or a SHA-1 hash as 20 binary bytes. | |
246 | When present, the hash is of ignore patterns |
|
246 | When present, the hash is of ignore patterns | |
247 | that were used for some previous run of the `status` algorithm. |
|
247 | that were used for some previous run of the `status` algorithm. | |
248 |
|
248 | |||
249 | * (Offset 44: end of tree metadata) |
|
249 | * (Offset 44: end of tree metadata) | |
250 |
|
250 | |||
251 | Optional hash of ignore patterns |
|
251 | Optional hash of ignore patterns | |
252 | -------------------------------- |
|
252 | -------------------------------- | |
253 |
|
253 | |||
254 | The implementation of `status` at `rust/hg-core/src/dirstate_tree/status.rs` |
|
254 | The implementation of `status` at `rust/hg-core/src/dirstate_tree/status.rs` | |
255 | has been optimized such that its run time is dominated by calls |
|
255 | has been optimized such that its run time is dominated by calls | |
256 | to `stat` for reading the filesystem metadata of a file or directory, |
|
256 | to `stat` for reading the filesystem metadata of a file or directory, | |
257 | and to `readdir` for listing the contents of a directory. |
|
257 | and to `readdir` for listing the contents of a directory. | |
258 | In some cases the algorithm can skip calls to `readdir` |
|
258 | In some cases the algorithm can skip calls to `readdir` | |
259 | (saving significant time) |
|
259 | (saving significant time) | |
260 | because the dirstate already contains enough of the relevant information |
|
260 | because the dirstate already contains enough of the relevant information | |
261 | to build the correct `status` results. |
|
261 | to build the correct `status` results. | |
262 |
|
262 | |||
263 | The default configuration of `hg status` is to list unknown files |
|
263 | The default configuration of `hg status` is to list unknown files | |
264 | but not ignored files. |
|
264 | but not ignored files. | |
265 | In this case, it matters for the `readdir`-skipping optimization |
|
265 | In this case, it matters for the `readdir`-skipping optimization | |
266 | if a given file used to be ignored but became unknown |
|
266 | if a given file used to be ignored but became unknown | |
267 | because `.hgignore` changed. |
|
267 | because `.hgignore` changed. | |
268 | To detect the possibility of such a change, |
|
268 | To detect the possibility of such a change, | |
269 | the tree metadata contains an optional hash of all ignore patterns. |
|
269 | the tree metadata contains an optional hash of all ignore patterns. | |
270 |
|
270 | |||
271 | We define: |
|
271 | We define: | |
272 |
|
272 | |||
273 | * "Root" ignore files as: |
|
273 | * "Root" ignore files as: | |
274 |
|
274 | |||
275 | - `.hgignore` at the root of the repository if it exists |
|
275 | - `.hgignore` at the root of the repository if it exists | |
276 | - And all files from `ui.ignore.*` config. |
|
276 | - And all files from `ui.ignore.*` config. | |
277 |
|
277 | |||
278 | This set of files is sorted by the string representation of their path. |
|
278 | This set of files is sorted by the string representation of their path. | |
279 |
|
279 | |||
280 | * The "expanded contents" of an ignore file is the byte string made 

280 | * The "expanded contents" of an ignore file is the byte string made | |
281 | by the concatenation of its contents followed by the "expanded contents" |
|
281 | by the concatenation of its contents followed by the "expanded contents" | |
282 | of other files included with `include:` or `subinclude:` directives, |
|
282 | of other files included with `include:` or `subinclude:` directives, | |
283 | in inclusion order. This definition is recursive, as included files can |
|
283 | in inclusion order. This definition is recursive, as included files can | |
284 | themselves include more files. |
|
284 | themselves include more files. | |
285 |
|
285 | |||
286 | This hash is defined as the SHA-1 of the concatenation (in sorted |
|
286 | This hash is defined as the SHA-1 of the concatenation (in sorted | |
287 | order) of the "expanded contents" of each "root" ignore file. |
|
287 | order) of the "expanded contents" of each "root" ignore file. | |
288 | (Note that computing this does not require actually concatenating |
|
288 | (Note that computing this does not require actually concatenating | |
289 | into a single contiguous byte sequence. |
|
289 | into a single contiguous byte sequence. | |
290 | Instead a SHA-1 hasher object can be created |
|
290 | Instead a SHA-1 hasher object can be created | |
291 | and fed separate chunks one by one.) |
|
291 | and fed separate chunks one by one.) | |
292 |
|
292 | |||
293 | The data file format |
|
293 | The data file format | |
294 | -------------------- |
|
294 | -------------------- | |
295 |
|
295 | |||
296 | This is implemented in `rust/hg-core/src/dirstate_tree/on_disk.rs` |
|
296 | This is implemented in `rust/hg-core/src/dirstate_tree/on_disk.rs` | |
297 | and `mercurial/dirstateutils/v2.py`. |
|
297 | and `mercurial/dirstateutils/v2.py`. | |
298 |
|
298 | |||
299 | The data file contains two types of data: paths and nodes. |
|
299 | The data file contains two types of data: paths and nodes. | |
300 |
|
300 | |||
301 | Paths and nodes can be organized in any order in the file, except that sibling |
|
301 | Paths and nodes can be organized in any order in the file, except that sibling | |
302 | nodes must be next to each other and sorted by their path. |
|
302 | nodes must be next to each other and sorted by their path. | |
303 | Contiguity lets the parent refer to them all |
|
303 | Contiguity lets the parent refer to them all | |
304 | by their count and a single pseudo-pointer, |
|
304 | by their count and a single pseudo-pointer, | |
305 | instead of storing one pseudo-pointer per child node. |
|
305 | instead of storing one pseudo-pointer per child node. | |
306 | Sorting allows using binary search to find a child node with a given name 

306 | Sorting allows using binary search to find a child node with a given name | |
307 | in `O(log(n))` byte sequence comparisons. |
|
307 | in `O(log(n))` byte sequence comparisons. | |
308 |
|
308 | |||
309 | The current implementation writes paths and child nodes before a given node 

309 | The current implementation writes paths and child nodes before a given node | |
310 | for ease of figuring out the value of pseudo-pointers by the time they are to be 

310 | for ease of figuring out the value of pseudo-pointers by the time they are to be | |
311 | written, but this is not an obligation and readers must not rely on it. |
|
311 | written, but this is not an obligation and readers must not rely on it. | |
312 |
|
312 | |||
313 | A path is stored as a byte string anywhere in the file, without delimiter. |
|
313 | A path is stored as a byte string anywhere in the file, without delimiter. | |
314 | It is referred to by one or more nodes by a pseudo-pointer to its start, and its 

314 | It is referred to by one or more nodes by a pseudo-pointer to its start, and its | |
315 | length in bytes. Since there is no delimiter, |
|
315 | length in bytes. Since there is no delimiter, | |
316 | when a path is a substring of another the same bytes could be reused, |
|
316 | when a path is a substring of another the same bytes could be reused, | |
317 | although the implementation does not exploit this as of this writing. |
|
317 | although the implementation does not exploit this as of this writing. | |
318 |
|
318 | |||
319 | A node is stored on 43 bytes with components at fixed offsets. Paths and |
|
319 | A node is stored on 43 bytes with components at fixed offsets. Paths and | |
320 | child nodes relevant to a node are stored externally and referenced through 

320 | child nodes relevant to a node are stored externally and referenced through | |
321 | pseudo-pointers. |
|
321 | pseudo-pointers. | |
322 |
|
322 | |||
323 | All integers are stored in big-endian. All pseudo-pointers are 32-bit integers |
|
323 | All integers are stored in big-endian. All pseudo-pointers are 32-bit integers | |
324 | counting bytes from the start of the data file. Path lengths and positions |
|
324 | counting bytes from the start of the data file. Path lengths and positions | |
325 | are 16-bit integers, also counted in bytes. |
|
325 | are 16-bit integers, also counted in bytes. | |
326 |
|
326 | |||
327 | Node components are: |
|
327 | Node components are: | |
328 |
|
328 | |||
329 | * Offset 0: |
|
329 | * Offset 0: | |
330 | Pseudo-pointer to the full path of this node, |
|
330 | Pseudo-pointer to the full path of this node, | |
331 | from the working directory root. |
|
331 | from the working directory root. | |
332 |
|
332 | |||
333 | * Offset 4: |
|
333 | * Offset 4: | |
334 | Length of the full path. |
|
334 | Length of the full path. | |
335 |
|
335 | |||
336 | * Offset 6: |
|
336 | * Offset 6: | |
337 | Position of the last `/` path separator within the full path, |
|
337 | Position of the last `/` path separator within the full path, | |
338 | in bytes from the start of the full path, |
|
338 | in bytes from the start of the full path, | |
339 | or zero if there isn’t one. 

339 | or zero if there isn’t one. | |
340 | The part of the full path after this position is the "base name". |
|
340 | The part of the full path after this position is the "base name". | |
341 | Since sibling nodes have the same parent, only their base names vary |

341 | Since sibling nodes have the same parent, only their base names vary | |
342 | and need to be considered when doing binary search to find a given path. |

342 | and need to be considered when doing binary search to find a given path. | |
343 |
|
343 | |||
344 | * Offset 8: |
|
344 | * Offset 8: | |
345 | Pseudo-pointer to the "copy source" path for this node, |
|
345 | Pseudo-pointer to the "copy source" path for this node, | |
346 | or zero if there is no copy source. |
|
346 | or zero if there is no copy source. | |
347 |
|
347 | |||
348 | * Offset 12: |
|
348 | * Offset 12: | |
349 | Length of the copy source path, or zero if there isn’t one. |

349 | Length of the copy source path, or zero if there isn’t one. | |
350 |
|
350 | |||
351 | * Offset 14: |
|
351 | * Offset 14: | |
352 | Pseudo-pointer to the start of child nodes. |
|
352 | Pseudo-pointer to the start of child nodes. | |
353 |
|
353 | |||
354 | * Offset 18: |
|
354 | * Offset 18: | |
355 | Number of child nodes, as a 32-bit integer. |
|
355 | Number of child nodes, as a 32-bit integer. | |
356 | They occupy 44 times this number of bytes |

356 | They occupy 44 times this number of bytes | |
357 | (not counting space for paths, and further descendants). |
|
357 | (not counting space for paths, and further descendants). | |
358 |
|
358 | |||
359 | * Offset 22: |
|
359 | * Offset 22: | |
360 | Number as a 32-bit integer of descendant nodes in this subtree, |
|
360 | Number as a 32-bit integer of descendant nodes in this subtree, | |
361 | not including this node itself, |
|
361 | not including this node itself, | |
362 | that "have a dirstate entry". |
|
362 | that "have a dirstate entry". | |
363 | Those nodes represent files that would be present at all in `dirstate-v1`. |
|
363 | Those nodes represent files that would be present at all in `dirstate-v1`. | |
364 | This is typically less than the total number of descendants. |
|
364 | This is typically less than the total number of descendants. | |
365 | This counter is used to implement `has_dir`. |
|
365 | This counter is used to implement `has_dir`. | |
366 |
|
366 | |||
367 | * Offset 26: |
|
367 | * Offset 26: | |
368 | Number as a 32-bit integer of descendant nodes in this subtree, |
|
368 | Number as a 32-bit integer of descendant nodes in this subtree, | |
369 | not including this node itself, |
|
369 | not including this node itself, | |
370 | that represent files tracked in the working directory. |
|
370 | that represent files tracked in the working directory. | |
371 | (For example, `hg rm` makes a file untracked.) |
|
371 | (For example, `hg rm` makes a file untracked.) | |
372 | This counter is used to implement `has_tracked_dir`. |
|
372 | This counter is used to implement `has_tracked_dir`. | |
373 |
|
373 | |||
374 | * Offset 30: |
|
374 | * Offset 30: | |
375 | A `flags` field that packs some boolean values as bits of a 16-bit integer. |

375 | A `flags` field that packs some boolean values as bits of a 16-bit integer. | |
376 | Starting from least-significant, bit masks are:: |
|
376 | Starting from least-significant, bit masks are:: | |
377 |
|
377 | |||
378 | WDIR_TRACKED = 1 << 0 |
|
378 | WDIR_TRACKED = 1 << 0 | |
379 | P1_TRACKED = 1 << 1 |
|
379 | P1_TRACKED = 1 << 1 | |
380 | P2_INFO = 1 << 2 |
|
380 | P2_INFO = 1 << 2 | |
381 | HAS_MODE_AND_SIZE = 1 << 3 |
|
381 | HAS_MODE_AND_SIZE = 1 << 3 | |
382 | HAS_FILE_MTIME = 1 << 4 |
|
382 | HAS_FILE_MTIME = 1 << 4 | |
383 | HAS_DIRECTORY_MTIME = 1 << 5 |
|
383 | HAS_DIRECTORY_MTIME = 1 << 5 | |
384 | MODE_EXEC_PERM = 1 << 6 |
|
384 | MODE_EXEC_PERM = 1 << 6 | |
385 | MODE_IS_SYMLINK = 1 << 7 |
|
385 | MODE_IS_SYMLINK = 1 << 7 | |
386 | EXPECTED_STATE_IS_MODIFIED = 1 << 8 |
|
386 | EXPECTED_STATE_IS_MODIFIED = 1 << 8 | |
387 | ALL_UNKNOWN_RECORDED = 1 << 9 |
|
387 | ALL_UNKNOWN_RECORDED = 1 << 9 | |
388 | ALL_IGNORED_RECORDED = 1 << 10 |
|
388 | ALL_IGNORED_RECORDED = 1 << 10 | |
|
389 | HAS_FALLBACK_EXEC = 1 << 11 | |||
|
390 | FALLBACK_EXEC = 1 << 12 | |||
|
391 | HAS_FALLBACK_SYMLINK = 1 << 13 | |||
|
392 | FALLBACK_SYMLINK = 1 << 14 | |||
389 |
|
393 | |||
390 | The meaning of each bit is described below. |
|
394 | The meaning of each bit is described below. | |
391 |
|
395 | |||
392 | Other bits are unset. |
|
396 | Other bits are unset. | |
393 | They may be assigned meaning in the future, |

397 | They may be assigned meaning in the future, | |
394 | with the limitation that Mercurial versions that pre-date such meaning |
|
398 | with the limitation that Mercurial versions that pre-date such meaning | |
395 | will always reset those bits to unset when writing nodes. |
|
399 | will always reset those bits to unset when writing nodes. | |
396 | (A new node is written for any mutation in its subtree, |
|
400 | (A new node is written for any mutation in its subtree, | |
397 | leaving the bytes of the old node unreachable |
|
401 | leaving the bytes of the old node unreachable | |
398 | until the data file is rewritten entirely.) |
|
402 | until the data file is rewritten entirely.) | |
399 |
|
403 | |||
400 | * Offset 32: |
|
404 | * Offset 32: | |
401 | A `size` field described below, as a 32-bit integer. |
|
405 | A `size` field described below, as a 32-bit integer. | |
402 | Unlike in dirstate-v1, negative values are not used. |
|
406 | Unlike in dirstate-v1, negative values are not used. | |
403 |
|
407 | |||
404 | * Offset 36: |
|
408 | * Offset 36: | |
405 | The seconds component of an `mtime` field described below, |
|
409 | The seconds component of an `mtime` field described below, | |
406 | as a 32-bit integer. |
|
410 | as a 32-bit integer. | |
407 | Unlike in dirstate-v1, negative values are not used. |
|
411 | Unlike in dirstate-v1, negative values are not used. | |
408 | When `mtime` is used, this is number of seconds since the Unix epoch |
|
412 | When `mtime` is used, this is number of seconds since the Unix epoch | |
409 | truncated to its lower 31 bits. |
|
413 | truncated to its lower 31 bits. | |
410 |
|
414 | |||
411 | * Offset 40: |
|
415 | * Offset 40: | |
412 | The nanoseconds component of an `mtime` field described below, |
|
416 | The nanoseconds component of an `mtime` field described below, | |
413 | as a 32-bit integer. |
|
417 | as a 32-bit integer. | |
414 | When `mtime` is used, |
|
418 | When `mtime` is used, | |
415 | this is the number of nanoseconds since `mtime.seconds`, |
|
419 | this is the number of nanoseconds since `mtime.seconds`, | |
416 | always strictly less than one billion. |

420 | always strictly less than one billion. | |
417 |
|
421 | |||
418 | This may be zero if more precision is not available. |
|
422 | This may be zero if more precision is not available. | |
419 | (This can happen because of limitations in any of Mercurial, Python, |
|
423 | (This can happen because of limitations in any of Mercurial, Python, | |
420 | libc, the operating system, …) |

424 | libc, the operating system, …) | |
421 |
|
425 | |||
422 | When comparing two mtimes and either has this component set to zero, |
|
426 | When comparing two mtimes and either has this component set to zero, | |
423 | the sub-second precision of both should be ignored. |
|
427 | the sub-second precision of both should be ignored. | |
424 | False positives when checking mtime equality due to clock resolution |
|
428 | False positives when checking mtime equality due to clock resolution | |
425 | are always possible and the status algorithm needs to deal with them, |
|
429 | are always possible and the status algorithm needs to deal with them, | |
426 | but having too many false negatives could be harmful too. |
|
430 | but having too many false negatives could be harmful too. | |
427 |
|
431 | |||
428 | * (Offset 44: end of this node) |
|
432 | * (Offset 44: end of this node) | |
429 |
|
433 | |||
430 | The meaning of the boolean values packed in `flags` is: |
|
434 | The meaning of the boolean values packed in `flags` is: | |
431 |
|
435 | |||
432 | `WDIR_TRACKED` |
|
436 | `WDIR_TRACKED` | |
433 | Set if the working directory contains a tracked file at this node’s path. |

437 | Set if the working directory contains a tracked file at this node’s path. | |
434 | This is typically set and unset by `hg add` and `hg rm`. |
|
438 | This is typically set and unset by `hg add` and `hg rm`. | |
435 |
|
439 | |||
436 | `P1_TRACKED` |
|
440 | `P1_TRACKED` | |
437 | Set if the working directory’s first parent changeset |

441 | Set if the working directory’s first parent changeset | |
438 | (whose node identifier is found in tree metadata) |

442 | (whose node identifier is found in tree metadata) | |
439 | contains a tracked file at this node’s path. |

443 | contains a tracked file at this node’s path. | |
440 | This is a cache to reduce manifest lookups. |
|
444 | This is a cache to reduce manifest lookups. | |
441 |
|
445 | |||
442 | `P2_INFO` |
|
446 | `P2_INFO` | |
443 | Set if the file has been involved in some merge operation. |
|
447 | Set if the file has been involved in some merge operation. | |
444 | Either because it was actually merged, |
|
448 | Either because it was actually merged, | |
445 | or because the version in the second parent (p2) was ahead, |

449 | or because the version in the second parent (p2) was ahead, | |
446 | or because some rename moved it there. |
|
450 | or because some rename moved it there. | |
447 | In either case `hg status` will want it displayed as modified. |
|
451 | In either case `hg status` will want it displayed as modified. | |
448 |
|
452 | |||
449 | Files that would be mentioned at all in the `dirstate-v1` file format |
|
453 | Files that would be mentioned at all in the `dirstate-v1` file format | |
450 | have a node with at least one of the above three bits set in `dirstate-v2`. |
|
454 | have a node with at least one of the above three bits set in `dirstate-v2`. | |
451 | Let’s call these files "tracked anywhere", |

455 | Let’s call these files "tracked anywhere", | |
452 | and "untracked" the nodes with all three of these bits unset. |
|
456 | and "untracked" the nodes with all three of these bits unset. | |
453 | Untracked nodes are typically for directories: |
|
457 | Untracked nodes are typically for directories: | |
454 | they hold child nodes and form the tree structure. |
|
458 | they hold child nodes and form the tree structure. | |
455 | Additional untracked nodes may also exist. |
|
459 | Additional untracked nodes may also exist. | |
456 | Although implementations should strive to clean up nodes |
|
460 | Although implementations should strive to clean up nodes | |
457 | that are entirely unused, other untracked nodes may also exist. |
|
461 | that are entirely unused, other untracked nodes may also exist. | |
458 | For example, a future version of Mercurial might in some cases |
|
462 | For example, a future version of Mercurial might in some cases | |
459 | add nodes for untracked files or/and ignored files in the working directory |
|
463 | add nodes for untracked files or/and ignored files in the working directory | |
460 | in order to optimize `hg status` |
|
464 | in order to optimize `hg status` | |
461 | by enabling it to skip `readdir` in more cases. |
|
465 | by enabling it to skip `readdir` in more cases. | |
462 |
|
466 | |||
463 | `HAS_MODE_AND_SIZE` |
|
467 | `HAS_MODE_AND_SIZE` | |
464 | Must be unset for untracked nodes. |
|
468 | Must be unset for untracked nodes. | |
465 | For files tracked anywhere, if this is set: |
|
469 | For files tracked anywhere, if this is set: | |
466 | - The `size` field is the expected file size, |
|
470 | - The `size` field is the expected file size, | |
467 | in bytes truncated to its lower 31 bits. |

471 | in bytes truncated to its lower 31 bits. | |
468 | - The expected execute permission for the file’s owner |

472 | - The expected execute permission for the file’s owner | |
469 | is given by `MODE_EXEC_PERM` |

473 | is given by `MODE_EXEC_PERM` | |
470 | - The expected file type is given by `MODE_IS_SYMLINK`: |

474 | - The expected file type is given by `MODE_IS_SYMLINK`: | |
471 | a symbolic link if set, or a normal file if unset. |
|
475 | a symbolic link if set, or a normal file if unset. | |
472 | If this is unset the expected size, permission, and file type are unknown. |
|
476 | If this is unset the expected size, permission, and file type are unknown. | |
473 | The `size` field is unused (set to zero). |
|
477 | The `size` field is unused (set to zero). | |
474 |
|
478 | |||
475 | `HAS_FILE_MTIME` |
|
479 | `HAS_FILE_MTIME` | |
476 | Must be unset for untracked nodes. |
|
480 | Must be unset for untracked nodes. | |
477 | If this and `HAS_DIRECTORY_MTIME` are both unset, |
|
481 | If this and `HAS_DIRECTORY_MTIME` are both unset, | |
478 | the `mtime` field is unused (set to zero). |
|
482 | the `mtime` field is unused (set to zero). | |
479 | If this is set, `mtime` is the expected modification time. |
|
483 | If this is set, `mtime` is the expected modification time. | |
480 |
|
484 | |||
481 | `HAS_DIRECTORY_MTIME` |
|
485 | `HAS_DIRECTORY_MTIME` | |
482 | Must be unset for files tracked anywhere. |

486 | Must be unset for files tracked anywhere. | |
483 | If this and `HAS_FILE_MTIME` are both unset, |

487 | If this and `HAS_FILE_MTIME` are both unset, | |
484 | the `mtime` field is unused (set to zero). |
|
488 | the `mtime` field is unused (set to zero). | |
485 | If this is set, at some point, |
|
489 | If this is set, at some point, | |
486 | this path in the working directory was observed: |
|
490 | this path in the working directory was observed: | |
487 |
|
491 | |||
488 | - To be a directory |
|
492 | - To be a directory | |
489 | - With the modification time given in `mtime` |
|
493 | - With the modification time given in `mtime` | |
490 | - That time was already strictly in the past when observed, |
|
494 | - That time was already strictly in the past when observed, | |
491 | meaning that later changes cannot happen in the same clock tick |
|
495 | meaning that later changes cannot happen in the same clock tick | |
492 | and must cause a different modification time |
|
496 | and must cause a different modification time | |
493 | (unless the system clock jumps back and we get unlucky, |
|
497 | (unless the system clock jumps back and we get unlucky, | |
494 | which is not impossible but deemed unlikely enough). |
|
498 | which is not impossible but deemed unlikely enough). | |
495 | - All direct children of this directory |
|
499 | - All direct children of this directory | |
496 | (as returned by `std::fs::read_dir`) |
|
500 | (as returned by `std::fs::read_dir`) | |
497 | either have a corresponding dirstate node, |
|
501 | either have a corresponding dirstate node, | |
498 | or are ignored by ignore patterns whose hash is in tree metadata. |
|
502 | or are ignored by ignore patterns whose hash is in tree metadata. | |
499 |
|
503 | |||
500 | This means that if `std::fs::symlink_metadata` later reports |
|
504 | This means that if `std::fs::symlink_metadata` later reports | |
501 | the same modification time |
|
505 | the same modification time | |
502 | and ignored patterns haven’t changed, |

506 | and ignored patterns haven’t changed, | |
503 | a run of status that is not listing ignored files |
|
507 | a run of status that is not listing ignored files | |
504 | can skip calling `std::fs::read_dir` again for this directory, |
|
508 | can skip calling `std::fs::read_dir` again for this directory, | |
505 | and iterate child dirstate nodes instead. |
|
509 | and iterate child dirstate nodes instead. | |
506 |
|
510 | |||
507 | `MODE_EXEC_PERM` |
|
511 | `MODE_EXEC_PERM` | |
508 | Must be unset if `HAS_MODE_AND_SIZE` is unset. |
|
512 | Must be unset if `HAS_MODE_AND_SIZE` is unset. | |
509 | If `HAS_MODE_AND_SIZE` is set, |
|
513 | If `HAS_MODE_AND_SIZE` is set, | |
510 | this indicates whether the file’s owner is expected |

514 | this indicates whether the file’s owner is expected | |
511 | to have execute permission. |
|
515 | to have execute permission. | |
512 |
|
516 | |||
513 | `MODE_IS_SYMLINK` |
|
517 | `MODE_IS_SYMLINK` | |
514 | Must be unset if `HAS_MODE_AND_SIZE` is unset. |
|
518 | Must be unset if `HAS_MODE_AND_SIZE` is unset. | |
515 | If `HAS_MODE_AND_SIZE` is set, |
|
519 | If `HAS_MODE_AND_SIZE` is set, | |
516 | this indicates whether the file is expected to be a symlink |
|
520 | this indicates whether the file is expected to be a symlink | |
517 | as opposed to a normal file. |
|
521 | as opposed to a normal file. | |
518 |
|
522 | |||
519 | `EXPECTED_STATE_IS_MODIFIED` |
|
523 | `EXPECTED_STATE_IS_MODIFIED` | |
520 | Must be unset for untracked nodes. |
|
524 | Must be unset for untracked nodes. | |
521 | For: |
|
525 | For: | |
522 | - a file tracked anywhere |
|
526 | - a file tracked anywhere | |
523 | - that has expected metadata (`HAS_MODE_AND_SIZE` and `HAS_FILE_MTIME`) |
|
527 | - that has expected metadata (`HAS_MODE_AND_SIZE` and `HAS_FILE_MTIME`) | |
524 | - if that metadata matches |
|
528 | - if that metadata matches | |
525 | metadata found in the working directory with `stat` |
|
529 | metadata found in the working directory with `stat` | |
526 | This bit indicates the status of the file. |
|
530 | This bit indicates the status of the file. | |
527 | If set, the status is modified. If unset, it is clean. |
|
531 | If set, the status is modified. If unset, it is clean. | |
528 |
|
532 | |||
529 | In cases where `hg status` needs to read the contents of a file |
|
533 | In cases where `hg status` needs to read the contents of a file | |
530 | because metadata is ambiguous, this bit lets it record the result |
|
534 | because metadata is ambiguous, this bit lets it record the result | |
531 | if the result is modified so that a future run of `hg status` |
|
535 | if the result is modified so that a future run of `hg status` | |
532 | does not need to do the same again. |
|
536 | does not need to do the same again. | |
533 | It is valid to never set this bit, |
|
537 | It is valid to never set this bit, | |
534 | and consider expected metadata ambiguous if it is set. |
|
538 | and consider expected metadata ambiguous if it is set. | |
535 |
|
539 | |||
536 | `ALL_UNKNOWN_RECORDED` |
|
540 | `ALL_UNKNOWN_RECORDED` | |
537 | If set, all "unknown" children existing on disk (at the time of the last |
|
541 | If set, all "unknown" children existing on disk (at the time of the last | |
538 | status) have been recorded and the `mtime` associated with |
|
542 | status) have been recorded and the `mtime` associated with | |
539 | `HAS_DIRECTORY_MTIME` can be used for optimization even when "unknown" files |

543 | `HAS_DIRECTORY_MTIME` can be used for optimization even when "unknown" files | |
540 | are listed. |
|
544 | are listed. | |
541 |
|
545 | |||
542 | Note that the number of recorded "unknown" children can still be zero if none |

546 | Note that the number of recorded "unknown" children can still be zero if none | |
543 | were present. |

547 | were present. | |
544 |
|
548 | |||
545 | Also note that having this flag unset does not imply that no "unknown" |
|
549 | Also note that having this flag unset does not imply that no "unknown" | |
546 | children have been recorded. Some might be present, but there is no guarantee |

550 | children have been recorded. Some might be present, but there is no guarantee | |
547 | that it will be all of them. |

551 | that it will be all of them. | |
548 |
|
552 | |||
549 | `ALL_IGNORED_RECORDED` |
|
553 | `ALL_IGNORED_RECORDED` | |
550 | If set, all "ignored" children existing on disk (at the time of the last |
|
554 | If set, all "ignored" children existing on disk (at the time of the last | |
551 | status) have been recorded and the `mtime` associated with |
|
555 | status) have been recorded and the `mtime` associated with | |
552 | `HAS_DIRECTORY_MTIME` can be used for optimization even when "ignored" files |

556 | `HAS_DIRECTORY_MTIME` can be used for optimization even when "ignored" files | |
553 | are listed. |
|
557 | are listed. | |
554 |
|
558 | |||
555 | Note that the number of recorded "ignored" children can still be zero if none |

559 | Note that the number of recorded "ignored" children can still be zero if none | |
556 | were present. |

560 | were present. | |
557 |
|
561 | |||
558 | Also note that having this flag unset does not imply that no "ignored" |
|
562 | Also note that having this flag unset does not imply that no "ignored" | |
559 | children have been recorded. Some might be present, but there is no guarantee |

563 | children have been recorded. Some might be present, but there is no guarantee | |
560 | that it will be all of them. |

564 | that it will be all of them. | |
|
565 | ||||
|
566 | `HAS_FALLBACK_EXEC` | |||
|
567 | If this flag is set, the entry carries "fallback" information for the | |||
|
568 | executable bit in the `FALLBACK_EXEC` flag. | |||
|
569 | ||||
|
570 | Fallback information can be stored in the dirstate to keep track of | |||
|
571 | filesystem attribute tracked by Mercurial when the underlying file | |||
|
572 | system or operating system does not support that property, (e.g. | |||
|
573 | Windows). | |||
|
574 | ||||
|
575 | `FALLBACK_EXEC` | |||
|
576 | Should be ignored if `HAS_FALLBACK_EXEC` is unset. If set the file for this | |||
|
577 | entry should be considered executable if that information cannot be | |||
|
578 | extracted from the file system. If unset it should be considered | |||
|
579 | non-executable instead. | |||
|
580 | ||||
|
581 | `HAS_FALLBACK_SYMLINK` | |||
|
582 | If this flag is set, the entry carries "fallback" information for symbolic | |||
|
583 | link status in the `FALLBACK_SYMLINK` flag. | |||
|
584 | ||||
|
585 | Fallback information can be stored in the dirstate to keep track of | |||
|
586 | filesystem attribute tracked by Mercurial when the underlying file | |||
|
587 | system or operating system does not support that property, (e.g. | |||
|
588 | Windows). | |||
|
589 | ||||
|
590 | `FALLBACK_SYMLINK` | |||
|
591 | Should be ignored if `HAS_FALLBACK_SYMLINK` is unset. If set the file for | |||
|
592 | this entry should be considered a symlink if that information cannot be | |||
|
593 | extracted from the file system. If unset it should be considered a normal | |||
|
594 | file instead. |
@@ -1,890 +1,915 b'' | |||||
1 | # parsers.py - Python implementation of parsers.c |
|
1 | # parsers.py - Python implementation of parsers.c | |
2 | # |
|
2 | # | |
3 | # Copyright 2009 Olivia Mackall <olivia@selenic.com> and others |
|
3 | # Copyright 2009 Olivia Mackall <olivia@selenic.com> and others | |
4 | # |
|
4 | # | |
5 | # This software may be used and distributed according to the terms of the |
|
5 | # This software may be used and distributed according to the terms of the | |
6 | # GNU General Public License version 2 or any later version. |
|
6 | # GNU General Public License version 2 or any later version. | |
7 |
|
7 | |||
8 | from __future__ import absolute_import |
|
8 | from __future__ import absolute_import | |
9 |
|
9 | |||
10 | import stat |
|
10 | import stat | |
11 | import struct |
|
11 | import struct | |
12 | import zlib |
|
12 | import zlib | |
13 |
|
13 | |||
14 | from ..node import ( |
|
14 | from ..node import ( | |
15 | nullrev, |
|
15 | nullrev, | |
16 | sha1nodeconstants, |
|
16 | sha1nodeconstants, | |
17 | ) |
|
17 | ) | |
18 | from ..thirdparty import attr |
|
18 | from ..thirdparty import attr | |
19 | from .. import ( |
|
19 | from .. import ( | |
20 | error, |
|
20 | error, | |
21 | pycompat, |
|
21 | pycompat, | |
22 | revlogutils, |
|
22 | revlogutils, | |
23 | util, |
|
23 | util, | |
24 | ) |
|
24 | ) | |
25 |
|
25 | |||
26 | from ..revlogutils import nodemap as nodemaputil |
|
26 | from ..revlogutils import nodemap as nodemaputil | |
27 | from ..revlogutils import constants as revlog_constants |
|
27 | from ..revlogutils import constants as revlog_constants | |
28 |
|
28 | |||
29 | stringio = pycompat.bytesio |
|
29 | stringio = pycompat.bytesio | |
30 |
|
30 | |||
31 |
|
31 | |||
32 | _pack = struct.pack |
|
32 | _pack = struct.pack | |
33 | _unpack = struct.unpack |
|
33 | _unpack = struct.unpack | |
34 | _compress = zlib.compress |
|
34 | _compress = zlib.compress | |
35 | _decompress = zlib.decompress |
|
35 | _decompress = zlib.decompress | |
36 |
|
36 | |||
37 |
|
37 | |||
38 | # a special value used internally for `size` if the file come from the other parent |
|
38 | # a special value used internally for `size` if the file come from the other parent | |
39 | FROM_P2 = -2 |
|
39 | FROM_P2 = -2 | |
40 |
|
40 | |||
41 | # a special value used internally for `size` if the file is modified/merged/added |
|
41 | # a special value used internally for `size` if the file is modified/merged/added | |
42 | NONNORMAL = -1 |
|
42 | NONNORMAL = -1 | |
43 |
|
43 | |||
44 | # a special value used internally for `time` if the time is ambiguous |

44 | # a special value used internally for `time` if the time is ambiguous | |
45 | AMBIGUOUS_TIME = -1 |
|
45 | AMBIGUOUS_TIME = -1 | |
46 |
|
46 | |||
47 | # Bits of the `flags` byte inside a node in the file format |
|
47 | # Bits of the `flags` byte inside a node in the file format | |
48 | DIRSTATE_V2_WDIR_TRACKED = 1 << 0 |
|
48 | DIRSTATE_V2_WDIR_TRACKED = 1 << 0 | |
49 | DIRSTATE_V2_P1_TRACKED = 1 << 1 |
|
49 | DIRSTATE_V2_P1_TRACKED = 1 << 1 | |
50 | DIRSTATE_V2_P2_INFO = 1 << 2 |
|
50 | DIRSTATE_V2_P2_INFO = 1 << 2 | |
51 | DIRSTATE_V2_HAS_MODE_AND_SIZE = 1 << 3 |
|
51 | DIRSTATE_V2_HAS_MODE_AND_SIZE = 1 << 3 | |
52 | DIRSTATE_V2_HAS_FILE_MTIME = 1 << 4 |
|
52 | DIRSTATE_V2_HAS_FILE_MTIME = 1 << 4 | |
53 | _DIRSTATE_V2_HAS_DIRCTORY_MTIME = 1 << 5 # Unused when Rust is not available |
|
53 | _DIRSTATE_V2_HAS_DIRCTORY_MTIME = 1 << 5 # Unused when Rust is not available | |
54 | DIRSTATE_V2_MODE_EXEC_PERM = 1 << 6 |
|
54 | DIRSTATE_V2_MODE_EXEC_PERM = 1 << 6 | |
55 | DIRSTATE_V2_MODE_IS_SYMLINK = 1 << 7 |
|
55 | DIRSTATE_V2_MODE_IS_SYMLINK = 1 << 7 | |
56 | DIRSTATE_V2_EXPECTED_STATE_IS_MODIFIED = 1 << 8 |
|
56 | DIRSTATE_V2_EXPECTED_STATE_IS_MODIFIED = 1 << 8 | |
57 | DIRSTATE_V2_ALL_UNKNOWN_RECORDED = 1 << 9 |
|
57 | DIRSTATE_V2_ALL_UNKNOWN_RECORDED = 1 << 9 | |
58 | DIRSTATE_V2_ALL_IGNORED_RECORDED = 1 << 10 |
|
58 | DIRSTATE_V2_ALL_IGNORED_RECORDED = 1 << 10 | |
|
59 | DIRSTATE_V2_HAS_FALLBACK_EXEC = 1 << 11 | |||
|
60 | DIRSTATE_V2_FALLBACK_EXEC = 1 << 12 | |||
|
61 | DIRSTATE_V2_HAS_FALLBACK_SYMLINK = 1 << 13 | |||
|
62 | DIRSTATE_V2_FALLBACK_SYMLINK = 1 << 14 | |||
59 |
|
63 | |||
60 |
|
64 | |||
61 | @attr.s(slots=True, init=False) |
|
65 | @attr.s(slots=True, init=False) | |
62 | class DirstateItem(object): |
|
66 | class DirstateItem(object): | |
63 | """represent a dirstate entry |
|
67 | """represent a dirstate entry | |
64 |
|
68 | |||
65 | It hold multiple attributes |
|
69 | It hold multiple attributes | |
66 |
|
70 | |||
67 | # about file tracking |
|
71 | # about file tracking | |
68 | - wc_tracked: is the file tracked by the working copy |
|
72 | - wc_tracked: is the file tracked by the working copy | |
69 | - p1_tracked: is the file tracked in working copy first parent |
|
73 | - p1_tracked: is the file tracked in working copy first parent | |
70 | - p2_info: the file has been involved in some merge operation. Either |
|
74 | - p2_info: the file has been involved in some merge operation. Either | |
71 | because it was actually merged, or because the p2 version was |
|
75 | because it was actually merged, or because the p2 version was | |
72 | ahead, or because some rename moved it there. In either case |
|
76 | ahead, or because some rename moved it there. In either case | |
73 | `hg status` will want it displayed as modified. |
|
77 | `hg status` will want it displayed as modified. | |
74 |
|
78 | |||
75 | # about the file state expected from p1 manifest: |
|
79 | # about the file state expected from p1 manifest: | |
76 | - mode: the file mode in p1 |
|
80 | - mode: the file mode in p1 | |
77 | - size: the file size in p1 |
|
81 | - size: the file size in p1 | |
78 |
|
82 | |||
79 | These value can be set to None, which mean we don't have a meaningful value |
|
83 | These value can be set to None, which mean we don't have a meaningful value | |
80 | to compare with. Either because we don't really care about them as there |
|
84 | to compare with. Either because we don't really care about them as there | |
81 | `status` is known without having to look at the disk or because we don't |
|
85 | `status` is known without having to look at the disk or because we don't | |
82 | know these right now and a full comparison will be needed to find out if |
|
86 | know these right now and a full comparison will be needed to find out if | |
83 | the file is clean. |
|
87 | the file is clean. | |
84 |
|
88 | |||
85 | # about the file state on disk last time we saw it: |
|
89 | # about the file state on disk last time we saw it: | |
86 | - mtime: the last known clean mtime for the file. |
|
90 | - mtime: the last known clean mtime for the file. | |
87 |
|
91 | |||
88 | This value can be set to None if no cachable state exist. Either because we |
|
92 | This value can be set to None if no cachable state exist. Either because we | |
89 | do not care (see previous section) or because we could not cache something |
|
93 | do not care (see previous section) or because we could not cache something | |
90 | yet. |
|
94 | yet. | |
91 | """ |
|
95 | """ | |
92 |
|
96 | |||
93 | _wc_tracked = attr.ib() |
|
97 | _wc_tracked = attr.ib() | |
94 | _p1_tracked = attr.ib() |
|
98 | _p1_tracked = attr.ib() | |
95 | _p2_info = attr.ib() |
|
99 | _p2_info = attr.ib() | |
96 | _mode = attr.ib() |
|
100 | _mode = attr.ib() | |
97 | _size = attr.ib() |
|
101 | _size = attr.ib() | |
98 | _mtime = attr.ib() |
|
102 | _mtime = attr.ib() | |
99 | _fallback_exec = attr.ib() |
|
103 | _fallback_exec = attr.ib() | |
100 | _fallback_symlink = attr.ib() |
|
104 | _fallback_symlink = attr.ib() | |
101 |
|
105 | |||
102 | def __init__( |
|
106 | def __init__( | |
103 | self, |
|
107 | self, | |
104 | wc_tracked=False, |
|
108 | wc_tracked=False, | |
105 | p1_tracked=False, |
|
109 | p1_tracked=False, | |
106 | p2_info=False, |
|
110 | p2_info=False, | |
107 | has_meaningful_data=True, |
|
111 | has_meaningful_data=True, | |
108 | has_meaningful_mtime=True, |
|
112 | has_meaningful_mtime=True, | |
109 | parentfiledata=None, |
|
113 | parentfiledata=None, | |
110 | fallback_exec=None, |
|
114 | fallback_exec=None, | |
111 | fallback_symlink=None, |
|
115 | fallback_symlink=None, | |
112 | ): |
|
116 | ): | |
113 | self._wc_tracked = wc_tracked |
|
117 | self._wc_tracked = wc_tracked | |
114 | self._p1_tracked = p1_tracked |
|
118 | self._p1_tracked = p1_tracked | |
115 | self._p2_info = p2_info |
|
119 | self._p2_info = p2_info | |
116 |
|
120 | |||
117 | self._fallback_exec = fallback_exec |
|
121 | self._fallback_exec = fallback_exec | |
118 | self._fallback_symlink = fallback_symlink |
|
122 | self._fallback_symlink = fallback_symlink | |
119 |
|
123 | |||
120 | self._mode = None |
|
124 | self._mode = None | |
121 | self._size = None |
|
125 | self._size = None | |
122 | self._mtime = None |
|
126 | self._mtime = None | |
123 | if parentfiledata is None: |
|
127 | if parentfiledata is None: | |
124 | has_meaningful_mtime = False |
|
128 | has_meaningful_mtime = False | |
125 | has_meaningful_data = False |
|
129 | has_meaningful_data = False | |
126 | if has_meaningful_data: |
|
130 | if has_meaningful_data: | |
127 | self._mode = parentfiledata[0] |
|
131 | self._mode = parentfiledata[0] | |
128 | self._size = parentfiledata[1] |
|
132 | self._size = parentfiledata[1] | |
129 | if has_meaningful_mtime: |
|
133 | if has_meaningful_mtime: | |
130 | self._mtime = parentfiledata[2] |
|
134 | self._mtime = parentfiledata[2] | |
131 |
|
135 | |||
132 | @classmethod |
|
136 | @classmethod | |
133 | def from_v2_data(cls, flags, size, mtime): |
|
137 | def from_v2_data(cls, flags, size, mtime): | |
134 | """Build a new DirstateItem object from V2 data""" |
|
138 | """Build a new DirstateItem object from V2 data""" | |
135 | has_mode_size = bool(flags & DIRSTATE_V2_HAS_MODE_AND_SIZE) |
|
139 | has_mode_size = bool(flags & DIRSTATE_V2_HAS_MODE_AND_SIZE) | |
136 | has_meaningful_mtime = bool(flags & DIRSTATE_V2_HAS_FILE_MTIME) |
|
140 | has_meaningful_mtime = bool(flags & DIRSTATE_V2_HAS_FILE_MTIME) | |
137 | mode = None |
|
141 | mode = None | |
138 |
|
142 | |||
139 | if flags & +DIRSTATE_V2_EXPECTED_STATE_IS_MODIFIED: |
|
143 | if flags & +DIRSTATE_V2_EXPECTED_STATE_IS_MODIFIED: | |
140 | # we do not have support for this flag in the code yet, |
|
144 | # we do not have support for this flag in the code yet, | |
141 | # force a lookup for this file. |
|
145 | # force a lookup for this file. | |
142 | has_mode_size = False |
|
146 | has_mode_size = False | |
143 | has_meaningful_mtime = False |
|
147 | has_meaningful_mtime = False | |
144 |
|
148 | |||
|
149 | fallback_exec = None | |||
|
150 | if flags & DIRSTATE_V2_HAS_FALLBACK_EXEC: | |||
|
151 | fallback_exec = flags & DIRSTATE_V2_FALLBACK_EXEC | |||
|
152 | ||||
|
153 | fallback_symlink = None | |||
|
154 | if flags & DIRSTATE_V2_HAS_FALLBACK_SYMLINK: | |||
|
155 | fallback_symlink = flags & DIRSTATE_V2_FALLBACK_SYMLINK | |||
|
156 | ||||
145 | if has_mode_size: |
|
157 | if has_mode_size: | |
146 | assert stat.S_IXUSR == 0o100 |
|
158 | assert stat.S_IXUSR == 0o100 | |
147 | if flags & DIRSTATE_V2_MODE_EXEC_PERM: |
|
159 | if flags & DIRSTATE_V2_MODE_EXEC_PERM: | |
148 | mode = 0o755 |
|
160 | mode = 0o755 | |
149 | else: |
|
161 | else: | |
150 | mode = 0o644 |
|
162 | mode = 0o644 | |
151 | if flags & DIRSTATE_V2_MODE_IS_SYMLINK: |
|
163 | if flags & DIRSTATE_V2_MODE_IS_SYMLINK: | |
152 | mode |= stat.S_IFLNK |
|
164 | mode |= stat.S_IFLNK | |
153 | else: |
|
165 | else: | |
154 | mode |= stat.S_IFREG |
|
166 | mode |= stat.S_IFREG | |
155 | return cls( |
|
167 | return cls( | |
156 | wc_tracked=bool(flags & DIRSTATE_V2_WDIR_TRACKED), |
|
168 | wc_tracked=bool(flags & DIRSTATE_V2_WDIR_TRACKED), | |
157 | p1_tracked=bool(flags & DIRSTATE_V2_P1_TRACKED), |
|
169 | p1_tracked=bool(flags & DIRSTATE_V2_P1_TRACKED), | |
158 | p2_info=bool(flags & DIRSTATE_V2_P2_INFO), |
|
170 | p2_info=bool(flags & DIRSTATE_V2_P2_INFO), | |
159 | has_meaningful_data=has_mode_size, |
|
171 | has_meaningful_data=has_mode_size, | |
160 | has_meaningful_mtime=has_meaningful_mtime, |
|
172 | has_meaningful_mtime=has_meaningful_mtime, | |
161 | parentfiledata=(mode, size, mtime), |
|
173 | parentfiledata=(mode, size, mtime), | |
|
174 | fallback_exec=fallback_exec, | |||
|
175 | fallback_symlink=fallback_symlink, | |||
162 | ) |
|
176 | ) | |
163 |
|
177 | |||
164 | @classmethod |
|
178 | @classmethod | |
165 | def from_v1_data(cls, state, mode, size, mtime): |
|
179 | def from_v1_data(cls, state, mode, size, mtime): | |
166 | """Build a new DirstateItem object from V1 data |
|
180 | """Build a new DirstateItem object from V1 data | |
167 |
|
181 | |||
168 | Since the dirstate-v1 format is frozen, the signature of this function |
|
182 | Since the dirstate-v1 format is frozen, the signature of this function | |
169 | is not expected to change, unlike the __init__ one. |
|
183 | is not expected to change, unlike the __init__ one. | |
170 | """ |
|
184 | """ | |
171 | if state == b'm': |
|
185 | if state == b'm': | |
172 | return cls(wc_tracked=True, p1_tracked=True, p2_info=True) |
|
186 | return cls(wc_tracked=True, p1_tracked=True, p2_info=True) | |
173 | elif state == b'a': |
|
187 | elif state == b'a': | |
174 | return cls(wc_tracked=True) |
|
188 | return cls(wc_tracked=True) | |
175 | elif state == b'r': |
|
189 | elif state == b'r': | |
176 | if size == NONNORMAL: |
|
190 | if size == NONNORMAL: | |
177 | p1_tracked = True |
|
191 | p1_tracked = True | |
178 | p2_info = True |
|
192 | p2_info = True | |
179 | elif size == FROM_P2: |
|
193 | elif size == FROM_P2: | |
180 | p1_tracked = False |
|
194 | p1_tracked = False | |
181 | p2_info = True |
|
195 | p2_info = True | |
182 | else: |
|
196 | else: | |
183 | p1_tracked = True |
|
197 | p1_tracked = True | |
184 | p2_info = False |
|
198 | p2_info = False | |
185 | return cls(p1_tracked=p1_tracked, p2_info=p2_info) |
|
199 | return cls(p1_tracked=p1_tracked, p2_info=p2_info) | |
186 | elif state == b'n': |
|
200 | elif state == b'n': | |
187 | if size == FROM_P2: |
|
201 | if size == FROM_P2: | |
188 | return cls(wc_tracked=True, p2_info=True) |
|
202 | return cls(wc_tracked=True, p2_info=True) | |
189 | elif size == NONNORMAL: |
|
203 | elif size == NONNORMAL: | |
190 | return cls(wc_tracked=True, p1_tracked=True) |
|
204 | return cls(wc_tracked=True, p1_tracked=True) | |
191 | elif mtime == AMBIGUOUS_TIME: |
|
205 | elif mtime == AMBIGUOUS_TIME: | |
192 | return cls( |
|
206 | return cls( | |
193 | wc_tracked=True, |
|
207 | wc_tracked=True, | |
194 | p1_tracked=True, |
|
208 | p1_tracked=True, | |
195 | has_meaningful_mtime=False, |
|
209 | has_meaningful_mtime=False, | |
196 | parentfiledata=(mode, size, 42), |
|
210 | parentfiledata=(mode, size, 42), | |
197 | ) |
|
211 | ) | |
198 | else: |
|
212 | else: | |
199 | return cls( |
|
213 | return cls( | |
200 | wc_tracked=True, |
|
214 | wc_tracked=True, | |
201 | p1_tracked=True, |
|
215 | p1_tracked=True, | |
202 | parentfiledata=(mode, size, mtime), |
|
216 | parentfiledata=(mode, size, mtime), | |
203 | ) |
|
217 | ) | |
204 | else: |
|
218 | else: | |
205 | raise RuntimeError(b'unknown state: %s' % state) |
|
219 | raise RuntimeError(b'unknown state: %s' % state) | |
206 |
|
220 | |||
207 | def set_possibly_dirty(self): |
|
221 | def set_possibly_dirty(self): | |
208 | """Mark a file as "possibly dirty" |
|
222 | """Mark a file as "possibly dirty" | |
209 |
|
223 | |||
210 | This means the next status call will have to actually check its content |
|
224 | This means the next status call will have to actually check its content | |
211 | to make sure it is correct. |
|
225 | to make sure it is correct. | |
212 | """ |
|
226 | """ | |
213 | self._mtime = None |
|
227 | self._mtime = None | |
214 |
|
228 | |||
215 | def set_clean(self, mode, size, mtime): |
|
229 | def set_clean(self, mode, size, mtime): | |
216 | """mark a file as "clean" cancelling potential "possibly dirty call" |
|
230 | """mark a file as "clean" cancelling potential "possibly dirty call" | |
217 |
|
231 | |||
218 | Note: this function is a descendant of `dirstate.normal` and is |
|
232 | Note: this function is a descendant of `dirstate.normal` and is | |
219 | currently expected to be call on "normal" entry only. There are not |
|
233 | currently expected to be call on "normal" entry only. There are not | |
220 | reason for this to not change in the future as long as the ccode is |
|
234 | reason for this to not change in the future as long as the ccode is | |
221 | updated to preserve the proper state of the non-normal files. |
|
235 | updated to preserve the proper state of the non-normal files. | |
222 | """ |
|
236 | """ | |
223 | self._wc_tracked = True |
|
237 | self._wc_tracked = True | |
224 | self._p1_tracked = True |
|
238 | self._p1_tracked = True | |
225 | self._mode = mode |
|
239 | self._mode = mode | |
226 | self._size = size |
|
240 | self._size = size | |
227 | self._mtime = mtime |
|
241 | self._mtime = mtime | |
228 |
|
242 | |||
229 | def set_tracked(self): |
|
243 | def set_tracked(self): | |
230 | """mark a file as tracked in the working copy |
|
244 | """mark a file as tracked in the working copy | |
231 |
|
245 | |||
232 | This will ultimately be called by command like `hg add`. |
|
246 | This will ultimately be called by command like `hg add`. | |
233 | """ |
|
247 | """ | |
234 | self._wc_tracked = True |
|
248 | self._wc_tracked = True | |
235 | # `set_tracked` is replacing various `normallookup` call. So we mark |
|
249 | # `set_tracked` is replacing various `normallookup` call. So we mark | |
236 | # the files as needing lookup |
|
250 | # the files as needing lookup | |
237 | # |
|
251 | # | |
238 | # Consider dropping this in the future in favor of something less broad. |
|
252 | # Consider dropping this in the future in favor of something less broad. | |
239 | self._mtime = None |
|
253 | self._mtime = None | |
240 |
|
254 | |||
241 | def set_untracked(self): |
|
255 | def set_untracked(self): | |
242 | """mark a file as untracked in the working copy |
|
256 | """mark a file as untracked in the working copy | |
243 |
|
257 | |||
244 | This will ultimately be called by command like `hg remove`. |
|
258 | This will ultimately be called by command like `hg remove`. | |
245 | """ |
|
259 | """ | |
246 | self._wc_tracked = False |
|
260 | self._wc_tracked = False | |
247 | self._mode = None |
|
261 | self._mode = None | |
248 | self._size = None |
|
262 | self._size = None | |
249 | self._mtime = None |
|
263 | self._mtime = None | |
250 |
|
264 | |||
251 | def drop_merge_data(self): |
|
265 | def drop_merge_data(self): | |
252 | """remove all "merge-only" from a DirstateItem |
|
266 | """remove all "merge-only" from a DirstateItem | |
253 |
|
267 | |||
254 | This is to be call by the dirstatemap code when the second parent is dropped |
|
268 | This is to be call by the dirstatemap code when the second parent is dropped | |
255 | """ |
|
269 | """ | |
256 | if self._p2_info: |
|
270 | if self._p2_info: | |
257 | self._p2_info = False |
|
271 | self._p2_info = False | |
258 | self._mode = None |
|
272 | self._mode = None | |
259 | self._size = None |
|
273 | self._size = None | |
260 | self._mtime = None |
|
274 | self._mtime = None | |
261 |
|
275 | |||
262 | @property |
|
276 | @property | |
263 | def mode(self): |
|
277 | def mode(self): | |
264 | return self.v1_mode() |
|
278 | return self.v1_mode() | |
265 |
|
279 | |||
266 | @property |
|
280 | @property | |
267 | def size(self): |
|
281 | def size(self): | |
268 | return self.v1_size() |
|
282 | return self.v1_size() | |
269 |
|
283 | |||
270 | @property |
|
284 | @property | |
271 | def mtime(self): |
|
285 | def mtime(self): | |
272 | return self.v1_mtime() |
|
286 | return self.v1_mtime() | |
273 |
|
287 | |||
274 | @property |
|
288 | @property | |
275 | def state(self): |
|
289 | def state(self): | |
276 | """ |
|
290 | """ | |
277 | States are: |
|
291 | States are: | |
278 | n normal |
|
292 | n normal | |
279 | m needs merging |
|
293 | m needs merging | |
280 | r marked for removal |
|
294 | r marked for removal | |
281 | a marked for addition |
|
295 | a marked for addition | |
282 |
|
296 | |||
283 | XXX This "state" is a bit obscure and mostly a direct expression of the |
|
297 | XXX This "state" is a bit obscure and mostly a direct expression of the | |
284 | dirstatev1 format. It would make sense to ultimately deprecate it in |
|
298 | dirstatev1 format. It would make sense to ultimately deprecate it in | |
285 | favor of the more "semantic" attributes. |
|
299 | favor of the more "semantic" attributes. | |
286 | """ |
|
300 | """ | |
287 | if not self.any_tracked: |
|
301 | if not self.any_tracked: | |
288 | return b'?' |
|
302 | return b'?' | |
289 | return self.v1_state() |
|
303 | return self.v1_state() | |
290 |
|
304 | |||
291 | @property |
|
305 | @property | |
292 | def has_fallback_exec(self): |
|
306 | def has_fallback_exec(self): | |
293 | """True if "fallback" information are available for the "exec" bit |
|
307 | """True if "fallback" information are available for the "exec" bit | |
294 |
|
308 | |||
295 | Fallback information can be stored in the dirstate to keep track of |
|
309 | Fallback information can be stored in the dirstate to keep track of | |
296 | filesystem attribute tracked by Mercurial when the underlying file |
|
310 | filesystem attribute tracked by Mercurial when the underlying file | |
297 | system or operating system does not support that property, (e.g. |
|
311 | system or operating system does not support that property, (e.g. | |
298 | Windows). |
|
312 | Windows). | |
299 |
|
313 | |||
300 | Not all version of the dirstate on-disk storage support preserving this |
|
314 | Not all version of the dirstate on-disk storage support preserving this | |
301 | information. |
|
315 | information. | |
302 | """ |
|
316 | """ | |
303 | return self._fallback_exec is not None |
|
317 | return self._fallback_exec is not None | |
304 |
|
318 | |||
305 | @property |
|
319 | @property | |
306 | def fallback_exec(self): |
|
320 | def fallback_exec(self): | |
307 | """ "fallback" information for the executable bit |
|
321 | """ "fallback" information for the executable bit | |
308 |
|
322 | |||
309 | True if the file should be considered executable when we cannot get |
|
323 | True if the file should be considered executable when we cannot get | |
310 | this information from the files system. False if it should be |
|
324 | this information from the files system. False if it should be | |
311 | considered non-executable. |
|
325 | considered non-executable. | |
312 |
|
326 | |||
313 | See has_fallback_exec for details.""" |
|
327 | See has_fallback_exec for details.""" | |
314 | return self._fallback_exec |
|
328 | return self._fallback_exec | |
315 |
|
329 | |||
316 | @fallback_exec.setter |
|
330 | @fallback_exec.setter | |
317 | def set_fallback_exec(self, value): |
|
331 | def set_fallback_exec(self, value): | |
318 | """control "fallback" executable bit |
|
332 | """control "fallback" executable bit | |
319 |
|
333 | |||
320 | Set to: |
|
334 | Set to: | |
321 | - True if the file should be considered executable, |
|
335 | - True if the file should be considered executable, | |
322 | - False if the file should be considered non-executable, |
|
336 | - False if the file should be considered non-executable, | |
323 | - None if we do not have valid fallback data. |
|
337 | - None if we do not have valid fallback data. | |
324 |
|
338 | |||
325 | See has_fallback_exec for details.""" |
|
339 | See has_fallback_exec for details.""" | |
326 | if value is None: |
|
340 | if value is None: | |
327 | self._fallback_exec = None |
|
341 | self._fallback_exec = None | |
328 | else: |
|
342 | else: | |
329 | self._fallback_exec = bool(value) |
|
343 | self._fallback_exec = bool(value) | |
330 |
|
344 | |||
331 | @property |
|
345 | @property | |
332 | def has_fallback_symlink(self): |
|
346 | def has_fallback_symlink(self): | |
333 | """True if "fallback" information are available for symlink status |
|
347 | """True if "fallback" information are available for symlink status | |
334 |
|
348 | |||
335 | Fallback information can be stored in the dirstate to keep track of |
|
349 | Fallback information can be stored in the dirstate to keep track of | |
336 | filesystem attribute tracked by Mercurial when the underlying file |
|
350 | filesystem attribute tracked by Mercurial when the underlying file | |
337 | system or operating system does not support that property, (e.g. |
|
351 | system or operating system does not support that property, (e.g. | |
338 | Windows). |
|
352 | Windows). | |
339 |
|
353 | |||
340 | Not all version of the dirstate on-disk storage support preserving this |
|
354 | Not all version of the dirstate on-disk storage support preserving this | |
341 | information.""" |
|
355 | information.""" | |
342 | return self._fallback_symlink is not None |
|
356 | return self._fallback_symlink is not None | |
343 |
|
357 | |||
344 | @property |
|
358 | @property | |
345 | def fallback_symlink(self): |
|
359 | def fallback_symlink(self): | |
346 | """ "fallback" information for symlink status |
|
360 | """ "fallback" information for symlink status | |
347 |
|
361 | |||
348 | True if the file should be considered executable when we cannot get |
|
362 | True if the file should be considered executable when we cannot get | |
349 | this information from the files system. False if it should be |
|
363 | this information from the files system. False if it should be | |
350 | considered non-executable. |
|
364 | considered non-executable. | |
351 |
|
365 | |||
352 | See has_fallback_exec for details.""" |
|
366 | See has_fallback_exec for details.""" | |
353 | return self._fallback_symlink |
|
367 | return self._fallback_symlink | |
354 |
|
368 | |||
355 | @fallback_symlink.setter |
|
369 | @fallback_symlink.setter | |
356 | def set_fallback_symlink(self, value): |
|
370 | def set_fallback_symlink(self, value): | |
357 | """control "fallback" symlink status |
|
371 | """control "fallback" symlink status | |
358 |
|
372 | |||
359 | Set to: |
|
373 | Set to: | |
360 | - True if the file should be considered a symlink, |
|
374 | - True if the file should be considered a symlink, | |
361 | - False if the file should be considered not a symlink, |
|
375 | - False if the file should be considered not a symlink, | |
362 | - None if we do not have valid fallback data. |
|
376 | - None if we do not have valid fallback data. | |
363 |
|
377 | |||
364 | See has_fallback_symlink for details.""" |
|
378 | See has_fallback_symlink for details.""" | |
365 | if value is None: |
|
379 | if value is None: | |
366 | self._fallback_symlink = None |
|
380 | self._fallback_symlink = None | |
367 | else: |
|
381 | else: | |
368 | self._fallback_symlink = bool(value) |
|
382 | self._fallback_symlink = bool(value) | |
369 |
|
383 | |||
370 | @property |
|
384 | @property | |
371 | def tracked(self): |
|
385 | def tracked(self): | |
372 | """True is the file is tracked in the working copy""" |
|
386 | """True is the file is tracked in the working copy""" | |
373 | return self._wc_tracked |
|
387 | return self._wc_tracked | |
374 |
|
388 | |||
375 | @property |
|
389 | @property | |
376 | def any_tracked(self): |
|
390 | def any_tracked(self): | |
377 | """True is the file is tracked anywhere (wc or parents)""" |
|
391 | """True is the file is tracked anywhere (wc or parents)""" | |
378 | return self._wc_tracked or self._p1_tracked or self._p2_info |
|
392 | return self._wc_tracked or self._p1_tracked or self._p2_info | |
379 |
|
393 | |||
380 | @property |
|
394 | @property | |
381 | def added(self): |
|
395 | def added(self): | |
382 | """True if the file has been added""" |
|
396 | """True if the file has been added""" | |
383 | return self._wc_tracked and not (self._p1_tracked or self._p2_info) |
|
397 | return self._wc_tracked and not (self._p1_tracked or self._p2_info) | |
384 |
|
398 | |||
385 | @property |
|
399 | @property | |
386 | def maybe_clean(self): |
|
400 | def maybe_clean(self): | |
387 | """True if the file has a chance to be in the "clean" state""" |
|
401 | """True if the file has a chance to be in the "clean" state""" | |
388 | if not self._wc_tracked: |
|
402 | if not self._wc_tracked: | |
389 | return False |
|
403 | return False | |
390 | elif not self._p1_tracked: |
|
404 | elif not self._p1_tracked: | |
391 | return False |
|
405 | return False | |
392 | elif self._p2_info: |
|
406 | elif self._p2_info: | |
393 | return False |
|
407 | return False | |
394 | return True |
|
408 | return True | |
395 |
|
409 | |||
396 | @property |
|
410 | @property | |
397 | def p1_tracked(self): |
|
411 | def p1_tracked(self): | |
398 | """True if the file is tracked in the first parent manifest""" |
|
412 | """True if the file is tracked in the first parent manifest""" | |
399 | return self._p1_tracked |
|
413 | return self._p1_tracked | |
400 |
|
414 | |||
401 | @property |
|
415 | @property | |
402 | def p2_info(self): |
|
416 | def p2_info(self): | |
403 | """True if the file needed to merge or apply any input from p2 |
|
417 | """True if the file needed to merge or apply any input from p2 | |
404 |
|
418 | |||
405 | See the class documentation for details. |
|
419 | See the class documentation for details. | |
406 | """ |
|
420 | """ | |
407 | return self._wc_tracked and self._p2_info |
|
421 | return self._wc_tracked and self._p2_info | |
408 |
|
422 | |||
409 | @property |
|
423 | @property | |
410 | def removed(self): |
|
424 | def removed(self): | |
411 | """True if the file has been removed""" |
|
425 | """True if the file has been removed""" | |
412 | return not self._wc_tracked and (self._p1_tracked or self._p2_info) |
|
426 | return not self._wc_tracked and (self._p1_tracked or self._p2_info) | |
413 |
|
427 | |||
414 | def v2_data(self): |
|
428 | def v2_data(self): | |
415 | """Returns (flags, mode, size, mtime) for v2 serialization""" |
|
429 | """Returns (flags, mode, size, mtime) for v2 serialization""" | |
416 | flags = 0 |
|
430 | flags = 0 | |
417 | if self._wc_tracked: |
|
431 | if self._wc_tracked: | |
418 | flags |= DIRSTATE_V2_WDIR_TRACKED |
|
432 | flags |= DIRSTATE_V2_WDIR_TRACKED | |
419 | if self._p1_tracked: |
|
433 | if self._p1_tracked: | |
420 | flags |= DIRSTATE_V2_P1_TRACKED |
|
434 | flags |= DIRSTATE_V2_P1_TRACKED | |
421 | if self._p2_info: |
|
435 | if self._p2_info: | |
422 | flags |= DIRSTATE_V2_P2_INFO |
|
436 | flags |= DIRSTATE_V2_P2_INFO | |
423 | if self._mode is not None and self._size is not None: |
|
437 | if self._mode is not None and self._size is not None: | |
424 | flags |= DIRSTATE_V2_HAS_MODE_AND_SIZE |
|
438 | flags |= DIRSTATE_V2_HAS_MODE_AND_SIZE | |
425 | if self.mode & stat.S_IXUSR: |
|
439 | if self.mode & stat.S_IXUSR: | |
426 | flags |= DIRSTATE_V2_MODE_EXEC_PERM |
|
440 | flags |= DIRSTATE_V2_MODE_EXEC_PERM | |
427 | if stat.S_ISLNK(self.mode): |
|
441 | if stat.S_ISLNK(self.mode): | |
428 | flags |= DIRSTATE_V2_MODE_IS_SYMLINK |
|
442 | flags |= DIRSTATE_V2_MODE_IS_SYMLINK | |
429 | if self._mtime is not None: |
|
443 | if self._mtime is not None: | |
430 | flags |= DIRSTATE_V2_HAS_FILE_MTIME |
|
444 | flags |= DIRSTATE_V2_HAS_FILE_MTIME | |
|
445 | ||||
|
446 | if self._fallback_exec is not None: | |||
|
447 | flags |= DIRSTATE_V2_HAS_FALLBACK_EXEC | |||
|
448 | if self._fallback_exec: | |||
|
449 | flags |= DIRSTATE_V2_FALLBACK_EXEC | |||
|
450 | ||||
|
451 | if self._fallback_symlink is not None: | |||
|
452 | flags |= DIRSTATE_V2_HAS_FALLBACK_SYMLINK | |||
|
453 | if self._fallback_symlink: | |||
|
454 | flags |= DIRSTATE_V2_FALLBACK_SYMLINK | |||
|
455 | ||||
431 | # Note: we do not need to do anything regarding |
|
456 | # Note: we do not need to do anything regarding | |
432 | # DIRSTATE_V2_ALL_UNKNOWN_RECORDED and DIRSTATE_V2_ALL_IGNORED_RECORDED |
|
457 | # DIRSTATE_V2_ALL_UNKNOWN_RECORDED and DIRSTATE_V2_ALL_IGNORED_RECORDED | |
433 | # since we never set _DIRSTATE_V2_HAS_DIRCTORY_MTIME |
|
458 | # since we never set _DIRSTATE_V2_HAS_DIRCTORY_MTIME | |
434 | return (flags, self._size or 0, self._mtime or 0) |
|
459 | return (flags, self._size or 0, self._mtime or 0) | |
435 |
|
460 | |||
436 | def v1_state(self): |
|
461 | def v1_state(self): | |
437 | """return a "state" suitable for v1 serialization""" |
|
462 | """return a "state" suitable for v1 serialization""" | |
438 | if not self.any_tracked: |
|
463 | if not self.any_tracked: | |
439 | # the object has no state to record, this is -currently- |
|
464 | # the object has no state to record, this is -currently- | |
440 | # unsupported |
|
465 | # unsupported | |
441 | raise RuntimeError('untracked item') |
|
466 | raise RuntimeError('untracked item') | |
442 | elif self.removed: |
|
467 | elif self.removed: | |
443 | return b'r' |
|
468 | return b'r' | |
444 | elif self._p1_tracked and self._p2_info: |
|
469 | elif self._p1_tracked and self._p2_info: | |
445 | return b'm' |
|
470 | return b'm' | |
446 | elif self.added: |
|
471 | elif self.added: | |
447 | return b'a' |
|
472 | return b'a' | |
448 | else: |
|
473 | else: | |
449 | return b'n' |
|
474 | return b'n' | |
450 |
|
475 | |||
451 | def v1_mode(self): |
|
476 | def v1_mode(self): | |
452 | """return a "mode" suitable for v1 serialization""" |
|
477 | """return a "mode" suitable for v1 serialization""" | |
453 | return self._mode if self._mode is not None else 0 |
|
478 | return self._mode if self._mode is not None else 0 | |
454 |
|
479 | |||
455 | def v1_size(self): |
|
480 | def v1_size(self): | |
456 | """return a "size" suitable for v1 serialization""" |
|
481 | """return a "size" suitable for v1 serialization""" | |
457 | if not self.any_tracked: |
|
482 | if not self.any_tracked: | |
458 | # the object has no state to record, this is -currently- |
|
483 | # the object has no state to record, this is -currently- | |
459 | # unsupported |
|
484 | # unsupported | |
460 | raise RuntimeError('untracked item') |
|
485 | raise RuntimeError('untracked item') | |
461 | elif self.removed and self._p1_tracked and self._p2_info: |
|
486 | elif self.removed and self._p1_tracked and self._p2_info: | |
462 | return NONNORMAL |
|
487 | return NONNORMAL | |
463 | elif self._p2_info: |
|
488 | elif self._p2_info: | |
464 | return FROM_P2 |
|
489 | return FROM_P2 | |
465 | elif self.removed: |
|
490 | elif self.removed: | |
466 | return 0 |
|
491 | return 0 | |
467 | elif self.added: |
|
492 | elif self.added: | |
468 | return NONNORMAL |
|
493 | return NONNORMAL | |
469 | elif self._size is None: |
|
494 | elif self._size is None: | |
470 | return NONNORMAL |
|
495 | return NONNORMAL | |
471 | else: |
|
496 | else: | |
472 | return self._size |
|
497 | return self._size | |
473 |
|
498 | |||
474 | def v1_mtime(self): |
|
499 | def v1_mtime(self): | |
475 | """return a "mtime" suitable for v1 serialization""" |
|
500 | """return a "mtime" suitable for v1 serialization""" | |
476 | if not self.any_tracked: |
|
501 | if not self.any_tracked: | |
477 | # the object has no state to record, this is -currently- |
|
502 | # the object has no state to record, this is -currently- | |
478 | # unsupported |
|
503 | # unsupported | |
479 | raise RuntimeError('untracked item') |
|
504 | raise RuntimeError('untracked item') | |
480 | elif self.removed: |
|
505 | elif self.removed: | |
481 | return 0 |
|
506 | return 0 | |
482 | elif self._mtime is None: |
|
507 | elif self._mtime is None: | |
483 | return AMBIGUOUS_TIME |
|
508 | return AMBIGUOUS_TIME | |
484 | elif self._p2_info: |
|
509 | elif self._p2_info: | |
485 | return AMBIGUOUS_TIME |
|
510 | return AMBIGUOUS_TIME | |
486 | elif not self._p1_tracked: |
|
511 | elif not self._p1_tracked: | |
487 | return AMBIGUOUS_TIME |
|
512 | return AMBIGUOUS_TIME | |
488 | else: |
|
513 | else: | |
489 | return self._mtime |
|
514 | return self._mtime | |
490 |
|
515 | |||
491 | def need_delay(self, now): |
|
516 | def need_delay(self, now): | |
492 | """True if the stored mtime would be ambiguous with the current time""" |
|
517 | """True if the stored mtime would be ambiguous with the current time""" | |
493 | return self.v1_state() == b'n' and self.v1_mtime() == now |
|
518 | return self.v1_state() == b'n' and self.v1_mtime() == now | |
494 |
|
519 | |||
495 |
|
520 | |||
496 | def gettype(q): |
|
521 | def gettype(q): | |
497 | return int(q & 0xFFFF) |
|
522 | return int(q & 0xFFFF) | |
498 |
|
523 | |||
499 |
|
524 | |||
500 | class BaseIndexObject(object): |
|
525 | class BaseIndexObject(object): | |
501 | # Can I be passed to an algorithme implemented in Rust ? |
|
526 | # Can I be passed to an algorithme implemented in Rust ? | |
502 | rust_ext_compat = 0 |
|
527 | rust_ext_compat = 0 | |
503 | # Format of an index entry according to Python's `struct` language |
|
528 | # Format of an index entry according to Python's `struct` language | |
504 | index_format = revlog_constants.INDEX_ENTRY_V1 |
|
529 | index_format = revlog_constants.INDEX_ENTRY_V1 | |
505 | # Size of a C unsigned long long int, platform independent |
|
530 | # Size of a C unsigned long long int, platform independent | |
506 | big_int_size = struct.calcsize(b'>Q') |
|
531 | big_int_size = struct.calcsize(b'>Q') | |
507 | # Size of a C long int, platform independent |
|
532 | # Size of a C long int, platform independent | |
508 | int_size = struct.calcsize(b'>i') |
|
533 | int_size = struct.calcsize(b'>i') | |
509 | # An empty index entry, used as a default value to be overridden, or nullrev |
|
534 | # An empty index entry, used as a default value to be overridden, or nullrev | |
510 | null_item = ( |
|
535 | null_item = ( | |
511 | 0, |
|
536 | 0, | |
512 | 0, |
|
537 | 0, | |
513 | 0, |
|
538 | 0, | |
514 | -1, |
|
539 | -1, | |
515 | -1, |
|
540 | -1, | |
516 | -1, |
|
541 | -1, | |
517 | -1, |
|
542 | -1, | |
518 | sha1nodeconstants.nullid, |
|
543 | sha1nodeconstants.nullid, | |
519 | 0, |
|
544 | 0, | |
520 | 0, |
|
545 | 0, | |
521 | revlog_constants.COMP_MODE_INLINE, |
|
546 | revlog_constants.COMP_MODE_INLINE, | |
522 | revlog_constants.COMP_MODE_INLINE, |
|
547 | revlog_constants.COMP_MODE_INLINE, | |
523 | ) |
|
548 | ) | |
524 |
|
549 | |||
525 | @util.propertycache |
|
550 | @util.propertycache | |
526 | def entry_size(self): |
|
551 | def entry_size(self): | |
527 | return self.index_format.size |
|
552 | return self.index_format.size | |
528 |
|
553 | |||
529 | @property |
|
554 | @property | |
530 | def nodemap(self): |
|
555 | def nodemap(self): | |
531 | msg = b"index.nodemap is deprecated, use index.[has_node|rev|get_rev]" |
|
556 | msg = b"index.nodemap is deprecated, use index.[has_node|rev|get_rev]" | |
532 | util.nouideprecwarn(msg, b'5.3', stacklevel=2) |
|
557 | util.nouideprecwarn(msg, b'5.3', stacklevel=2) | |
533 | return self._nodemap |
|
558 | return self._nodemap | |
534 |
|
559 | |||
535 | @util.propertycache |
|
560 | @util.propertycache | |
536 | def _nodemap(self): |
|
561 | def _nodemap(self): | |
537 | nodemap = nodemaputil.NodeMap({sha1nodeconstants.nullid: nullrev}) |
|
562 | nodemap = nodemaputil.NodeMap({sha1nodeconstants.nullid: nullrev}) | |
538 | for r in range(0, len(self)): |
|
563 | for r in range(0, len(self)): | |
539 | n = self[r][7] |
|
564 | n = self[r][7] | |
540 | nodemap[n] = r |
|
565 | nodemap[n] = r | |
541 | return nodemap |
|
566 | return nodemap | |
542 |
|
567 | |||
543 | def has_node(self, node): |
|
568 | def has_node(self, node): | |
544 | """return True if the node exist in the index""" |
|
569 | """return True if the node exist in the index""" | |
545 | return node in self._nodemap |
|
570 | return node in self._nodemap | |
546 |
|
571 | |||
547 | def rev(self, node): |
|
572 | def rev(self, node): | |
548 | """return a revision for a node |
|
573 | """return a revision for a node | |
549 |
|
574 | |||
550 | If the node is unknown, raise a RevlogError""" |
|
575 | If the node is unknown, raise a RevlogError""" | |
551 | return self._nodemap[node] |
|
576 | return self._nodemap[node] | |
552 |
|
577 | |||
553 | def get_rev(self, node): |
|
578 | def get_rev(self, node): | |
554 | """return a revision for a node |
|
579 | """return a revision for a node | |
555 |
|
580 | |||
556 | If the node is unknown, return None""" |
|
581 | If the node is unknown, return None""" | |
557 | return self._nodemap.get(node) |
|
582 | return self._nodemap.get(node) | |
558 |
|
583 | |||
559 | def _stripnodes(self, start): |
|
584 | def _stripnodes(self, start): | |
560 | if '_nodemap' in vars(self): |
|
585 | if '_nodemap' in vars(self): | |
561 | for r in range(start, len(self)): |
|
586 | for r in range(start, len(self)): | |
562 | n = self[r][7] |
|
587 | n = self[r][7] | |
563 | del self._nodemap[n] |
|
588 | del self._nodemap[n] | |
564 |
|
589 | |||
565 | def clearcaches(self): |
|
590 | def clearcaches(self): | |
566 | self.__dict__.pop('_nodemap', None) |
|
591 | self.__dict__.pop('_nodemap', None) | |
567 |
|
592 | |||
568 | def __len__(self): |
|
593 | def __len__(self): | |
569 | return self._lgt + len(self._extra) |
|
594 | return self._lgt + len(self._extra) | |
570 |
|
595 | |||
571 | def append(self, tup): |
|
596 | def append(self, tup): | |
572 | if '_nodemap' in vars(self): |
|
597 | if '_nodemap' in vars(self): | |
573 | self._nodemap[tup[7]] = len(self) |
|
598 | self._nodemap[tup[7]] = len(self) | |
574 | data = self._pack_entry(len(self), tup) |
|
599 | data = self._pack_entry(len(self), tup) | |
575 | self._extra.append(data) |
|
600 | self._extra.append(data) | |
576 |
|
601 | |||
577 | def _pack_entry(self, rev, entry): |
|
602 | def _pack_entry(self, rev, entry): | |
578 | assert entry[8] == 0 |
|
603 | assert entry[8] == 0 | |
579 | assert entry[9] == 0 |
|
604 | assert entry[9] == 0 | |
580 | return self.index_format.pack(*entry[:8]) |
|
605 | return self.index_format.pack(*entry[:8]) | |
581 |
|
606 | |||
582 | def _check_index(self, i): |
|
607 | def _check_index(self, i): | |
583 | if not isinstance(i, int): |
|
608 | if not isinstance(i, int): | |
584 | raise TypeError(b"expecting int indexes") |
|
609 | raise TypeError(b"expecting int indexes") | |
585 | if i < 0 or i >= len(self): |
|
610 | if i < 0 or i >= len(self): | |
586 | raise IndexError |
|
611 | raise IndexError | |
587 |
|
612 | |||
588 | def __getitem__(self, i): |
|
613 | def __getitem__(self, i): | |
589 | if i == -1: |
|
614 | if i == -1: | |
590 | return self.null_item |
|
615 | return self.null_item | |
591 | self._check_index(i) |
|
616 | self._check_index(i) | |
592 | if i >= self._lgt: |
|
617 | if i >= self._lgt: | |
593 | data = self._extra[i - self._lgt] |
|
618 | data = self._extra[i - self._lgt] | |
594 | else: |
|
619 | else: | |
595 | index = self._calculate_index(i) |
|
620 | index = self._calculate_index(i) | |
596 | data = self._data[index : index + self.entry_size] |
|
621 | data = self._data[index : index + self.entry_size] | |
597 | r = self._unpack_entry(i, data) |
|
622 | r = self._unpack_entry(i, data) | |
598 | if self._lgt and i == 0: |
|
623 | if self._lgt and i == 0: | |
599 | offset = revlogutils.offset_type(0, gettype(r[0])) |
|
624 | offset = revlogutils.offset_type(0, gettype(r[0])) | |
600 | r = (offset,) + r[1:] |
|
625 | r = (offset,) + r[1:] | |
601 | return r |
|
626 | return r | |
602 |
|
627 | |||
603 | def _unpack_entry(self, rev, data): |
|
628 | def _unpack_entry(self, rev, data): | |
604 | r = self.index_format.unpack(data) |
|
629 | r = self.index_format.unpack(data) | |
605 | r = r + ( |
|
630 | r = r + ( | |
606 | 0, |
|
631 | 0, | |
607 | 0, |
|
632 | 0, | |
608 | revlog_constants.COMP_MODE_INLINE, |
|
633 | revlog_constants.COMP_MODE_INLINE, | |
609 | revlog_constants.COMP_MODE_INLINE, |
|
634 | revlog_constants.COMP_MODE_INLINE, | |
610 | ) |
|
635 | ) | |
611 | return r |
|
636 | return r | |
612 |
|
637 | |||
613 | def pack_header(self, header): |
|
638 | def pack_header(self, header): | |
614 | """pack header information as binary""" |
|
639 | """pack header information as binary""" | |
615 | v_fmt = revlog_constants.INDEX_HEADER |
|
640 | v_fmt = revlog_constants.INDEX_HEADER | |
616 | return v_fmt.pack(header) |
|
641 | return v_fmt.pack(header) | |
617 |
|
642 | |||
618 | def entry_binary(self, rev): |
|
643 | def entry_binary(self, rev): | |
619 | """return the raw binary string representing a revision""" |
|
644 | """return the raw binary string representing a revision""" | |
620 | entry = self[rev] |
|
645 | entry = self[rev] | |
621 | p = revlog_constants.INDEX_ENTRY_V1.pack(*entry[:8]) |
|
646 | p = revlog_constants.INDEX_ENTRY_V1.pack(*entry[:8]) | |
622 | if rev == 0: |
|
647 | if rev == 0: | |
623 | p = p[revlog_constants.INDEX_HEADER.size :] |
|
648 | p = p[revlog_constants.INDEX_HEADER.size :] | |
624 | return p |
|
649 | return p | |
625 |
|
650 | |||
626 |
|
651 | |||
627 | class IndexObject(BaseIndexObject): |
|
652 | class IndexObject(BaseIndexObject): | |
628 | def __init__(self, data): |
|
653 | def __init__(self, data): | |
629 | assert len(data) % self.entry_size == 0, ( |
|
654 | assert len(data) % self.entry_size == 0, ( | |
630 | len(data), |
|
655 | len(data), | |
631 | self.entry_size, |
|
656 | self.entry_size, | |
632 | len(data) % self.entry_size, |
|
657 | len(data) % self.entry_size, | |
633 | ) |
|
658 | ) | |
634 | self._data = data |
|
659 | self._data = data | |
635 | self._lgt = len(data) // self.entry_size |
|
660 | self._lgt = len(data) // self.entry_size | |
636 | self._extra = [] |
|
661 | self._extra = [] | |
637 |
|
662 | |||
638 | def _calculate_index(self, i): |
|
663 | def _calculate_index(self, i): | |
639 | return i * self.entry_size |
|
664 | return i * self.entry_size | |
640 |
|
665 | |||
641 | def __delitem__(self, i): |
|
666 | def __delitem__(self, i): | |
642 | if not isinstance(i, slice) or not i.stop == -1 or i.step is not None: |
|
667 | if not isinstance(i, slice) or not i.stop == -1 or i.step is not None: | |
643 | raise ValueError(b"deleting slices only supports a:-1 with step 1") |
|
668 | raise ValueError(b"deleting slices only supports a:-1 with step 1") | |
644 | i = i.start |
|
669 | i = i.start | |
645 | self._check_index(i) |
|
670 | self._check_index(i) | |
646 | self._stripnodes(i) |
|
671 | self._stripnodes(i) | |
647 | if i < self._lgt: |
|
672 | if i < self._lgt: | |
648 | self._data = self._data[: i * self.entry_size] |
|
673 | self._data = self._data[: i * self.entry_size] | |
649 | self._lgt = i |
|
674 | self._lgt = i | |
650 | self._extra = [] |
|
675 | self._extra = [] | |
651 | else: |
|
676 | else: | |
652 | self._extra = self._extra[: i - self._lgt] |
|
677 | self._extra = self._extra[: i - self._lgt] | |
653 |
|
678 | |||
654 |
|
679 | |||
655 | class PersistentNodeMapIndexObject(IndexObject): |
|
680 | class PersistentNodeMapIndexObject(IndexObject): | |
656 | """a Debug oriented class to test persistent nodemap |
|
681 | """a Debug oriented class to test persistent nodemap | |
657 |
|
682 | |||
658 | We need a simple python object to test API and higher level behavior. See |
|
683 | We need a simple python object to test API and higher level behavior. See | |
659 | the Rust implementation for more serious usage. This should be used only |
|
684 | the Rust implementation for more serious usage. This should be used only | |
660 | through the dedicated `devel.persistent-nodemap` config. |
|
685 | through the dedicated `devel.persistent-nodemap` config. | |
661 | """ |
|
686 | """ | |
662 |
|
687 | |||
663 | def nodemap_data_all(self): |
|
688 | def nodemap_data_all(self): | |
664 | """Return bytes containing a full serialization of a nodemap |
|
689 | """Return bytes containing a full serialization of a nodemap | |
665 |
|
690 | |||
666 | The nodemap should be valid for the full set of revisions in the |
|
691 | The nodemap should be valid for the full set of revisions in the | |
667 | index.""" |
|
692 | index.""" | |
668 | return nodemaputil.persistent_data(self) |
|
693 | return nodemaputil.persistent_data(self) | |
669 |
|
694 | |||
670 | def nodemap_data_incremental(self): |
|
695 | def nodemap_data_incremental(self): | |
671 | """Return bytes containing an incremental update to persistent nodemap |

696 | """Return bytes containing an incremental update to persistent nodemap | |
672 |
|
697 | |||
673 | This contains the data for an append-only update of the data provided |

698 | This contains the data for an append-only update of the data provided | |
674 | in the last call to `update_nodemap_data`. |
|
699 | in the last call to `update_nodemap_data`. | |
675 | """ |
|
700 | """ | |
676 | if self._nm_root is None: |
|
701 | if self._nm_root is None: | |
677 | return None |
|
702 | return None | |
678 | docket = self._nm_docket |
|
703 | docket = self._nm_docket | |
679 | changed, data = nodemaputil.update_persistent_data( |
|
704 | changed, data = nodemaputil.update_persistent_data( | |
680 | self, self._nm_root, self._nm_max_idx, self._nm_docket.tip_rev |
|
705 | self, self._nm_root, self._nm_max_idx, self._nm_docket.tip_rev | |
681 | ) |
|
706 | ) | |
682 |
|
707 | |||
683 | self._nm_root = self._nm_max_idx = self._nm_docket = None |
|
708 | self._nm_root = self._nm_max_idx = self._nm_docket = None | |
684 | return docket, changed, data |
|
709 | return docket, changed, data | |
685 |
|
710 | |||
686 | def update_nodemap_data(self, docket, nm_data): |
|
711 | def update_nodemap_data(self, docket, nm_data): | |
687 | """provide full block of persisted binary data for a nodemap |
|
712 | """provide full block of persisted binary data for a nodemap | |
688 |
|
713 | |||
689 | The data are expected to come from disk. See `nodemap_data_all` for a |
|
714 | The data are expected to come from disk. See `nodemap_data_all` for a | |
690 | producer of such data.""" |

715 | producer of such data.""" | |
691 | if nm_data is not None: |
|
716 | if nm_data is not None: | |
692 | self._nm_root, self._nm_max_idx = nodemaputil.parse_data(nm_data) |
|
717 | self._nm_root, self._nm_max_idx = nodemaputil.parse_data(nm_data) | |
693 | if self._nm_root: |
|
718 | if self._nm_root: | |
694 | self._nm_docket = docket |
|
719 | self._nm_docket = docket | |
695 | else: |
|
720 | else: | |
696 | self._nm_root = self._nm_max_idx = self._nm_docket = None |
|
721 | self._nm_root = self._nm_max_idx = self._nm_docket = None | |
697 |
|
722 | |||
698 |
|
723 | |||
699 | class InlinedIndexObject(BaseIndexObject): |
|
724 | class InlinedIndexObject(BaseIndexObject): | |
700 | def __init__(self, data, inline=0): |
|
725 | def __init__(self, data, inline=0): | |
701 | self._data = data |
|
726 | self._data = data | |
702 | self._lgt = self._inline_scan(None) |
|
727 | self._lgt = self._inline_scan(None) | |
703 | self._inline_scan(self._lgt) |
|
728 | self._inline_scan(self._lgt) | |
704 | self._extra = [] |
|
729 | self._extra = [] | |
705 |
|
730 | |||
706 | def _inline_scan(self, lgt): |
|
731 | def _inline_scan(self, lgt): | |
707 | off = 0 |
|
732 | off = 0 | |
708 | if lgt is not None: |
|
733 | if lgt is not None: | |
709 | self._offsets = [0] * lgt |
|
734 | self._offsets = [0] * lgt | |
710 | count = 0 |
|
735 | count = 0 | |
711 | while off <= len(self._data) - self.entry_size: |
|
736 | while off <= len(self._data) - self.entry_size: | |
712 | start = off + self.big_int_size |
|
737 | start = off + self.big_int_size | |
713 | (s,) = struct.unpack( |
|
738 | (s,) = struct.unpack( | |
714 | b'>i', |
|
739 | b'>i', | |
715 | self._data[start : start + self.int_size], |
|
740 | self._data[start : start + self.int_size], | |
716 | ) |
|
741 | ) | |
717 | if lgt is not None: |
|
742 | if lgt is not None: | |
718 | self._offsets[count] = off |
|
743 | self._offsets[count] = off | |
719 | count += 1 |
|
744 | count += 1 | |
720 | off += self.entry_size + s |
|
745 | off += self.entry_size + s | |
721 | if off != len(self._data): |
|
746 | if off != len(self._data): | |
722 | raise ValueError(b"corrupted data") |
|
747 | raise ValueError(b"corrupted data") | |
723 | return count |
|
748 | return count | |
724 |
|
749 | |||
725 | def __delitem__(self, i): |
|
750 | def __delitem__(self, i): | |
726 | if not isinstance(i, slice) or not i.stop == -1 or i.step is not None: |
|
751 | if not isinstance(i, slice) or not i.stop == -1 or i.step is not None: | |
727 | raise ValueError(b"deleting slices only supports a:-1 with step 1") |
|
752 | raise ValueError(b"deleting slices only supports a:-1 with step 1") | |
728 | i = i.start |
|
753 | i = i.start | |
729 | self._check_index(i) |
|
754 | self._check_index(i) | |
730 | self._stripnodes(i) |
|
755 | self._stripnodes(i) | |
731 | if i < self._lgt: |
|
756 | if i < self._lgt: | |
732 | self._offsets = self._offsets[:i] |
|
757 | self._offsets = self._offsets[:i] | |
733 | self._lgt = i |
|
758 | self._lgt = i | |
734 | self._extra = [] |
|
759 | self._extra = [] | |
735 | else: |
|
760 | else: | |
736 | self._extra = self._extra[: i - self._lgt] |
|
761 | self._extra = self._extra[: i - self._lgt] | |
737 |
|
762 | |||
738 | def _calculate_index(self, i): |
|
763 | def _calculate_index(self, i): | |
739 | return self._offsets[i] |
|
764 | return self._offsets[i] | |
740 |
|
765 | |||
741 |
|
766 | |||
742 | def parse_index2(data, inline, revlogv2=False): |
|
767 | def parse_index2(data, inline, revlogv2=False): | |
743 | if not inline: |
|
768 | if not inline: | |
744 | cls = IndexObject2 if revlogv2 else IndexObject |
|
769 | cls = IndexObject2 if revlogv2 else IndexObject | |
745 | return cls(data), None |
|
770 | return cls(data), None | |
746 | cls = InlinedIndexObject |
|
771 | cls = InlinedIndexObject | |
747 | return cls(data, inline), (0, data) |
|
772 | return cls(data, inline), (0, data) | |
748 |
|
773 | |||
749 |
|
774 | |||
750 | def parse_index_cl_v2(data): |
|
775 | def parse_index_cl_v2(data): | |
751 | return IndexChangelogV2(data), None |
|
776 | return IndexChangelogV2(data), None | |
752 |
|
777 | |||
753 |
|
778 | |||
754 | class IndexObject2(IndexObject): |
|
779 | class IndexObject2(IndexObject): | |
755 | index_format = revlog_constants.INDEX_ENTRY_V2 |
|
780 | index_format = revlog_constants.INDEX_ENTRY_V2 | |
756 |
|
781 | |||
757 | def replace_sidedata_info( |
|
782 | def replace_sidedata_info( | |
758 | self, |
|
783 | self, | |
759 | rev, |
|
784 | rev, | |
760 | sidedata_offset, |
|
785 | sidedata_offset, | |
761 | sidedata_length, |
|
786 | sidedata_length, | |
762 | offset_flags, |
|
787 | offset_flags, | |
763 | compression_mode, |
|
788 | compression_mode, | |
764 | ): |
|
789 | ): | |
765 | """ |
|
790 | """ | |
766 | Replace an existing index entry's sidedata offset and length with new |
|
791 | Replace an existing index entry's sidedata offset and length with new | |
767 | ones. |
|
792 | ones. | |
768 | This cannot be used outside of the context of sidedata rewriting, |
|
793 | This cannot be used outside of the context of sidedata rewriting, | |
769 | inside the transaction that creates the revision `rev`. |
|
794 | inside the transaction that creates the revision `rev`. | |
770 | """ |
|
795 | """ | |
771 | if rev < 0: |
|
796 | if rev < 0: | |
772 | raise KeyError |
|
797 | raise KeyError | |
773 | self._check_index(rev) |
|
798 | self._check_index(rev) | |
774 | if rev < self._lgt: |
|
799 | if rev < self._lgt: | |
775 | msg = b"cannot rewrite entries outside of this transaction" |
|
800 | msg = b"cannot rewrite entries outside of this transaction" | |
776 | raise KeyError(msg) |
|
801 | raise KeyError(msg) | |
777 | else: |
|
802 | else: | |
778 | entry = list(self[rev]) |
|
803 | entry = list(self[rev]) | |
779 | entry[0] = offset_flags |
|
804 | entry[0] = offset_flags | |
780 | entry[8] = sidedata_offset |
|
805 | entry[8] = sidedata_offset | |
781 | entry[9] = sidedata_length |
|
806 | entry[9] = sidedata_length | |
782 | entry[11] = compression_mode |
|
807 | entry[11] = compression_mode | |
783 | entry = tuple(entry) |
|
808 | entry = tuple(entry) | |
784 | new = self._pack_entry(rev, entry) |
|
809 | new = self._pack_entry(rev, entry) | |
785 | self._extra[rev - self._lgt] = new |
|
810 | self._extra[rev - self._lgt] = new | |
786 |
|
811 | |||
787 | def _unpack_entry(self, rev, data): |
|
812 | def _unpack_entry(self, rev, data): | |
788 | data = self.index_format.unpack(data) |
|
813 | data = self.index_format.unpack(data) | |
789 | entry = data[:10] |
|
814 | entry = data[:10] | |
790 | data_comp = data[10] & 3 |
|
815 | data_comp = data[10] & 3 | |
791 | sidedata_comp = (data[10] & (3 << 2)) >> 2 |
|
816 | sidedata_comp = (data[10] & (3 << 2)) >> 2 | |
792 | return entry + (data_comp, sidedata_comp) |
|
817 | return entry + (data_comp, sidedata_comp) | |
793 |
|
818 | |||
794 | def _pack_entry(self, rev, entry): |
|
819 | def _pack_entry(self, rev, entry): | |
795 | data = entry[:10] |
|
820 | data = entry[:10] | |
796 | data_comp = entry[10] & 3 |
|
821 | data_comp = entry[10] & 3 | |
797 | sidedata_comp = (entry[11] & 3) << 2 |
|
822 | sidedata_comp = (entry[11] & 3) << 2 | |
798 | data += (data_comp | sidedata_comp,) |
|
823 | data += (data_comp | sidedata_comp,) | |
799 |
|
824 | |||
800 | return self.index_format.pack(*data) |
|
825 | return self.index_format.pack(*data) | |
801 |
|
826 | |||
802 | def entry_binary(self, rev): |
|
827 | def entry_binary(self, rev): | |
803 | """return the raw binary string representing a revision""" |
|
828 | """return the raw binary string representing a revision""" | |
804 | entry = self[rev] |
|
829 | entry = self[rev] | |
805 | return self._pack_entry(rev, entry) |
|
830 | return self._pack_entry(rev, entry) | |
806 |
|
831 | |||
807 | def pack_header(self, header): |
|
832 | def pack_header(self, header): | |
808 | """pack header information as binary""" |
|
833 | """pack header information as binary""" | |
809 | msg = 'version header should go in the docket, not the index: %d' |
|
834 | msg = 'version header should go in the docket, not the index: %d' | |
810 | msg %= header |
|
835 | msg %= header | |
811 | raise error.ProgrammingError(msg) |
|
836 | raise error.ProgrammingError(msg) | |
812 |
|
837 | |||
813 |
|
838 | |||
814 | class IndexChangelogV2(IndexObject2): |
|
839 | class IndexChangelogV2(IndexObject2): | |
815 | index_format = revlog_constants.INDEX_ENTRY_CL_V2 |
|
840 | index_format = revlog_constants.INDEX_ENTRY_CL_V2 | |
816 |
|
841 | |||
817 | def _unpack_entry(self, rev, data, r=True): |
|
842 | def _unpack_entry(self, rev, data, r=True): | |
818 | items = self.index_format.unpack(data) |
|
843 | items = self.index_format.unpack(data) | |
819 | entry = items[:3] + (rev, rev) + items[3:8] |
|
844 | entry = items[:3] + (rev, rev) + items[3:8] | |
820 | data_comp = items[8] & 3 |
|
845 | data_comp = items[8] & 3 | |
821 | sidedata_comp = (items[8] >> 2) & 3 |
|
846 | sidedata_comp = (items[8] >> 2) & 3 | |
822 | return entry + (data_comp, sidedata_comp) |
|
847 | return entry + (data_comp, sidedata_comp) | |
823 |
|
848 | |||
824 | def _pack_entry(self, rev, entry): |
|
849 | def _pack_entry(self, rev, entry): | |
825 | assert entry[3] == rev, entry[3] |
|
850 | assert entry[3] == rev, entry[3] | |
826 | assert entry[4] == rev, entry[4] |
|
851 | assert entry[4] == rev, entry[4] | |
827 | data = entry[:3] + entry[5:10] |
|
852 | data = entry[:3] + entry[5:10] | |
828 | data_comp = entry[10] & 3 |
|
853 | data_comp = entry[10] & 3 | |
829 | sidedata_comp = (entry[11] & 3) << 2 |
|
854 | sidedata_comp = (entry[11] & 3) << 2 | |
830 | data += (data_comp | sidedata_comp,) |
|
855 | data += (data_comp | sidedata_comp,) | |
831 | return self.index_format.pack(*data) |
|
856 | return self.index_format.pack(*data) | |
832 |
|
857 | |||
833 |
|
858 | |||
834 | def parse_index_devel_nodemap(data, inline): |
|
859 | def parse_index_devel_nodemap(data, inline): | |
835 | """like parse_index2, but always return a PersistentNodeMapIndexObject""" |

860 | """like parse_index2, but always return a PersistentNodeMapIndexObject""" | |
836 | return PersistentNodeMapIndexObject(data), None |
|
861 | return PersistentNodeMapIndexObject(data), None | |
837 |
|
862 | |||
838 |
|
863 | |||
839 | def parse_dirstate(dmap, copymap, st): |
|
864 | def parse_dirstate(dmap, copymap, st): | |
840 | parents = [st[:20], st[20:40]] |
|
865 | parents = [st[:20], st[20:40]] | |
841 | # dereference fields so they will be local in loop |
|
866 | # dereference fields so they will be local in loop | |
842 | format = b">cllll" |
|
867 | format = b">cllll" | |
843 | e_size = struct.calcsize(format) |
|
868 | e_size = struct.calcsize(format) | |
844 | pos1 = 40 |
|
869 | pos1 = 40 | |
845 | l = len(st) |
|
870 | l = len(st) | |
846 |
|
871 | |||
847 | # the inner loop |
|
872 | # the inner loop | |
848 | while pos1 < l: |
|
873 | while pos1 < l: | |
849 | pos2 = pos1 + e_size |
|
874 | pos2 = pos1 + e_size | |
850 | e = _unpack(b">cllll", st[pos1:pos2]) # a literal here is faster |
|
875 | e = _unpack(b">cllll", st[pos1:pos2]) # a literal here is faster | |
851 | pos1 = pos2 + e[4] |
|
876 | pos1 = pos2 + e[4] | |
852 | f = st[pos2:pos1] |
|
877 | f = st[pos2:pos1] | |
853 | if b'\0' in f: |
|
878 | if b'\0' in f: | |
854 | f, c = f.split(b'\0') |
|
879 | f, c = f.split(b'\0') | |
855 | copymap[f] = c |
|
880 | copymap[f] = c | |
856 | dmap[f] = DirstateItem.from_v1_data(*e[:4]) |
|
881 | dmap[f] = DirstateItem.from_v1_data(*e[:4]) | |
857 | return parents |
|
882 | return parents | |
858 |
|
883 | |||
859 |
|
884 | |||
860 | def pack_dirstate(dmap, copymap, pl, now): |
|
885 | def pack_dirstate(dmap, copymap, pl, now): | |
861 | now = int(now) |
|
886 | now = int(now) | |
862 | cs = stringio() |
|
887 | cs = stringio() | |
863 | write = cs.write |
|
888 | write = cs.write | |
864 | write(b"".join(pl)) |
|
889 | write(b"".join(pl)) | |
865 | for f, e in pycompat.iteritems(dmap): |
|
890 | for f, e in pycompat.iteritems(dmap): | |
866 | if e.need_delay(now): |
|
891 | if e.need_delay(now): | |
867 | # The file was last modified "simultaneously" with the current |
|
892 | # The file was last modified "simultaneously" with the current | |
868 | # write to dirstate (i.e. within the same second for file- |
|
893 | # write to dirstate (i.e. within the same second for file- | |
869 | # systems with a granularity of 1 sec). This commonly happens |
|
894 | # systems with a granularity of 1 sec). This commonly happens | |
870 | # for at least a couple of files on 'update'. |
|
895 | # for at least a couple of files on 'update'. | |
871 | # The user could change the file without changing its size |
|
896 | # The user could change the file without changing its size | |
872 | # within the same second. Invalidate the file's mtime in |
|
897 | # within the same second. Invalidate the file's mtime in | |
873 | # dirstate, forcing future 'status' calls to compare the |
|
898 | # dirstate, forcing future 'status' calls to compare the | |
874 | # contents of the file if the size is the same. This prevents |
|
899 | # contents of the file if the size is the same. This prevents | |
875 | # mistakenly treating such files as clean. |
|
900 | # mistakenly treating such files as clean. | |
876 | e.set_possibly_dirty() |
|
901 | e.set_possibly_dirty() | |
877 |
|
902 | |||
878 | if f in copymap: |
|
903 | if f in copymap: | |
879 | f = b"%s\0%s" % (f, copymap[f]) |
|
904 | f = b"%s\0%s" % (f, copymap[f]) | |
880 | e = _pack( |
|
905 | e = _pack( | |
881 | b">cllll", |
|
906 | b">cllll", | |
882 | e.v1_state(), |
|
907 | e.v1_state(), | |
883 | e.v1_mode(), |
|
908 | e.v1_mode(), | |
884 | e.v1_size(), |
|
909 | e.v1_size(), | |
885 | e.v1_mtime(), |
|
910 | e.v1_mtime(), | |
886 | len(f), |
|
911 | len(f), | |
887 | ) |
|
912 | ) | |
888 | write(e) |
|
913 | write(e) | |
889 | write(f) |
|
914 | write(f) | |
890 | return cs.getvalue() |
|
915 | return cs.getvalue() |
@@ -1,621 +1,637 b'' | |||||
1 | use crate::dirstate_tree::on_disk::DirstateV2ParseError; |
|
1 | use crate::dirstate_tree::on_disk::DirstateV2ParseError; | |
2 | use crate::errors::HgError; |
|
2 | use crate::errors::HgError; | |
3 | use bitflags::bitflags; |
|
3 | use bitflags::bitflags; | |
4 | use std::convert::{TryFrom, TryInto}; |
|
4 | use std::convert::{TryFrom, TryInto}; | |
5 | use std::fs; |
|
5 | use std::fs; | |
6 | use std::io; |
|
6 | use std::io; | |
7 | use std::time::{SystemTime, UNIX_EPOCH}; |
|
7 | use std::time::{SystemTime, UNIX_EPOCH}; | |
8 |
|
8 | |||
9 | #[derive(Copy, Clone, Debug, Eq, PartialEq)] |
|
9 | #[derive(Copy, Clone, Debug, Eq, PartialEq)] | |
10 | pub enum EntryState { |
|
10 | pub enum EntryState { | |
11 | Normal, |
|
11 | Normal, | |
12 | Added, |
|
12 | Added, | |
13 | Removed, |
|
13 | Removed, | |
14 | Merged, |
|
14 | Merged, | |
15 | } |
|
15 | } | |
16 |
|
16 | |||
17 | /// The C implementation uses all signed types. This will be an issue |
|
17 | /// The C implementation uses all signed types. This will be an issue | |
18 | /// either when 4GB+ source files are commonplace or in 2038, whichever |
|
18 | /// either when 4GB+ source files are commonplace or in 2038, whichever | |
19 | /// comes first. |
|
19 | /// comes first. | |
20 | #[derive(Debug, PartialEq, Copy, Clone)] |
|
20 | #[derive(Debug, PartialEq, Copy, Clone)] | |
21 | pub struct DirstateEntry { |
|
21 | pub struct DirstateEntry { | |
22 | pub(crate) flags: Flags, |
|
22 | pub(crate) flags: Flags, | |
23 | mode_size: Option<(u32, u32)>, |
|
23 | mode_size: Option<(u32, u32)>, | |
24 | mtime: Option<u32>, |
|
24 | mtime: Option<u32>, | |
25 | } |
|
25 | } | |
26 |
|
26 | |||
27 | bitflags! { |
|
27 | bitflags! { | |
28 | pub(crate) struct Flags: u8 { |
|
28 | pub(crate) struct Flags: u8 { | |
29 | const WDIR_TRACKED = 1 << 0; |
|
29 | const WDIR_TRACKED = 1 << 0; | |
30 | const P1_TRACKED = 1 << 1; |
|
30 | const P1_TRACKED = 1 << 1; | |
31 | const P2_INFO = 1 << 2; |
|
31 | const P2_INFO = 1 << 2; | |
32 | const HAS_FALLBACK_EXEC = 1 << 3; |
|
32 | const HAS_FALLBACK_EXEC = 1 << 3; | |
33 | const FALLBACK_EXEC = 1 << 4; |
|
33 | const FALLBACK_EXEC = 1 << 4; | |
34 | const HAS_FALLBACK_SYMLINK = 1 << 5; |
|
34 | const HAS_FALLBACK_SYMLINK = 1 << 5; | |
35 | const FALLBACK_SYMLINK = 1 << 6; |
|
35 | const FALLBACK_SYMLINK = 1 << 6; | |
36 | } |
|
36 | } | |
37 | } |
|
37 | } | |
38 |
|
38 | |||
39 | /// A Unix timestamp with nanoseconds precision |
|
39 | /// A Unix timestamp with nanoseconds precision | |
40 | #[derive(Copy, Clone)] |
|
40 | #[derive(Copy, Clone)] | |
41 | pub struct TruncatedTimestamp { |
|
41 | pub struct TruncatedTimestamp { | |
42 | truncated_seconds: u32, |
|
42 | truncated_seconds: u32, | |
43 | /// Always in the `0 .. 1_000_000_000` range. |
|
43 | /// Always in the `0 .. 1_000_000_000` range. | |
44 | nanoseconds: u32, |
|
44 | nanoseconds: u32, | |
45 | } |
|
45 | } | |
46 |
|
46 | |||
47 | impl TruncatedTimestamp { |
|
47 | impl TruncatedTimestamp { | |
48 | /// Constructs from a timestamp potentially outside of the supported range, |
|
48 | /// Constructs from a timestamp potentially outside of the supported range, | |
49 | /// and truncate the seconds components to its lower 31 bits. |
|
49 | /// and truncate the seconds components to its lower 31 bits. | |
50 | /// |
|
50 | /// | |
51 | /// Panics if the nanoseconds components is not in the expected range. |
|
51 | /// Panics if the nanoseconds components is not in the expected range. | |
52 | pub fn new_truncate(seconds: i64, nanoseconds: u32) -> Self { |
|
52 | pub fn new_truncate(seconds: i64, nanoseconds: u32) -> Self { | |
53 | assert!(nanoseconds < NSEC_PER_SEC); |
|
53 | assert!(nanoseconds < NSEC_PER_SEC); | |
54 | Self { |
|
54 | Self { | |
55 | truncated_seconds: seconds as u32 & RANGE_MASK_31BIT, |
|
55 | truncated_seconds: seconds as u32 & RANGE_MASK_31BIT, | |
56 | nanoseconds, |
|
56 | nanoseconds, | |
57 | } |
|
57 | } | |
58 | } |
|
58 | } | |
59 |
|
59 | |||
60 | /// Construct from components. Returns an error if they are not in the |
|
60 | /// Construct from components. Returns an error if they are not in the | |
61 | /// expected range. |

61 | /// expected range. | |
62 | pub fn from_already_truncated( |
|
62 | pub fn from_already_truncated( | |
63 | truncated_seconds: u32, |
|
63 | truncated_seconds: u32, | |
64 | nanoseconds: u32, |
|
64 | nanoseconds: u32, | |
65 | ) -> Result<Self, DirstateV2ParseError> { |
|
65 | ) -> Result<Self, DirstateV2ParseError> { | |
66 | if truncated_seconds & !RANGE_MASK_31BIT == 0 |
|
66 | if truncated_seconds & !RANGE_MASK_31BIT == 0 | |
67 | && nanoseconds < NSEC_PER_SEC |
|
67 | && nanoseconds < NSEC_PER_SEC | |
68 | { |
|
68 | { | |
69 | Ok(Self { |
|
69 | Ok(Self { | |
70 | truncated_seconds, |
|
70 | truncated_seconds, | |
71 | nanoseconds, |
|
71 | nanoseconds, | |
72 | }) |
|
72 | }) | |
73 | } else { |
|
73 | } else { | |
74 | Err(DirstateV2ParseError) |
|
74 | Err(DirstateV2ParseError) | |
75 | } |
|
75 | } | |
76 | } |
|
76 | } | |
77 |
|
77 | |||
78 | pub fn for_mtime_of(metadata: &fs::Metadata) -> io::Result<Self> { |
|
78 | pub fn for_mtime_of(metadata: &fs::Metadata) -> io::Result<Self> { | |
79 | #[cfg(unix)] |
|
79 | #[cfg(unix)] | |
80 | { |
|
80 | { | |
81 | use std::os::unix::fs::MetadataExt; |
|
81 | use std::os::unix::fs::MetadataExt; | |
82 | let seconds = metadata.mtime(); |
|
82 | let seconds = metadata.mtime(); | |
83 | // i64 -> u32 with value always in the `0 .. NSEC_PER_SEC` range |

83 | // i64 -> u32 with value always in the `0 .. NSEC_PER_SEC` range | |
84 | let nanoseconds = metadata.mtime_nsec().try_into().unwrap(); |
|
84 | let nanoseconds = metadata.mtime_nsec().try_into().unwrap(); | |
85 | Ok(Self::new_truncate(seconds, nanoseconds)) |
|
85 | Ok(Self::new_truncate(seconds, nanoseconds)) | |
86 | } |
|
86 | } | |
87 | #[cfg(not(unix))] |
|
87 | #[cfg(not(unix))] | |
88 | { |
|
88 | { | |
89 | metadata.modified().map(Self::from) |
|
89 | metadata.modified().map(Self::from) | |
90 | } |
|
90 | } | |
91 | } |
|
91 | } | |
92 |
|
92 | |||
93 | /// The lower 31 bits of the number of seconds since the epoch. |
|
93 | /// The lower 31 bits of the number of seconds since the epoch. | |
94 | pub fn truncated_seconds(&self) -> u32 { |
|
94 | pub fn truncated_seconds(&self) -> u32 { | |
95 | self.truncated_seconds |
|
95 | self.truncated_seconds | |
96 | } |
|
96 | } | |
97 |
|
97 | |||
98 | /// The sub-second component of this timestamp, in nanoseconds. |
|
98 | /// The sub-second component of this timestamp, in nanoseconds. | |
99 | /// Always in the `0 .. 1_000_000_000` range. |
|
99 | /// Always in the `0 .. 1_000_000_000` range. | |
100 | /// |
|
100 | /// | |
101 | /// This timestamp is after `(seconds, 0)` by this many nanoseconds. |
|
101 | /// This timestamp is after `(seconds, 0)` by this many nanoseconds. | |
102 | pub fn nanoseconds(&self) -> u32 { |
|
102 | pub fn nanoseconds(&self) -> u32 { | |
103 | self.nanoseconds |
|
103 | self.nanoseconds | |
104 | } |
|
104 | } | |
105 |
|
105 | |||
106 | /// Returns whether two timestamps are equal modulo 2**31 seconds. |
|
106 | /// Returns whether two timestamps are equal modulo 2**31 seconds. | |
107 | /// |
|
107 | /// | |
108 | /// If this returns `true`, the original values converted from `SystemTime` |
|
108 | /// If this returns `true`, the original values converted from `SystemTime` | |
109 | /// or given to `new_truncate` were very likely equal. A false positive is |
|
109 | /// or given to `new_truncate` were very likely equal. A false positive is | |
110 | /// possible if they were exactly a multiple of 2**31 seconds apart (around |
|
110 | /// possible if they were exactly a multiple of 2**31 seconds apart (around | |
111 | /// 68 years). This is deemed very unlikely to happen by chance, especially |
|
111 | /// 68 years). This is deemed very unlikely to happen by chance, especially | |
112 | /// on filesystems that support sub-second precision. |
|
112 | /// on filesystems that support sub-second precision. | |
113 | /// |
|
113 | /// | |
114 | /// If someone is manipulating the modification times of some files to |
|
114 | /// If someone is manipulating the modification times of some files to | |
115 | /// intentionally make `hg status` return incorrect results, not truncating |
|
115 | /// intentionally make `hg status` return incorrect results, not truncating | |
116 | /// wouldn’t help much since they can set exactly the expected timestamp. |

116 | /// wouldn’t help much since they can set exactly the expected timestamp. | |
117 | pub fn very_likely_equal(self, other: Self) -> bool { |
|
117 | pub fn very_likely_equal(self, other: Self) -> bool { | |
118 | self.truncated_seconds == other.truncated_seconds |
|
118 | self.truncated_seconds == other.truncated_seconds | |
119 | && self.nanoseconds == other.nanoseconds |
|
119 | && self.nanoseconds == other.nanoseconds | |
120 | } |
|
120 | } | |
121 |
|
121 | |||
122 | pub fn very_likely_equal_to_mtime_of( |
|
122 | pub fn very_likely_equal_to_mtime_of( | |
123 | self, |
|
123 | self, | |
124 | metadata: &fs::Metadata, |
|
124 | metadata: &fs::Metadata, | |
125 | ) -> io::Result<bool> { |
|
125 | ) -> io::Result<bool> { | |
126 | Ok(self.very_likely_equal(Self::for_mtime_of(metadata)?)) |
|
126 | Ok(self.very_likely_equal(Self::for_mtime_of(metadata)?)) | |
127 | } |
|
127 | } | |
128 | } |
|
128 | } | |
129 |
|
129 | |||
130 | impl From<SystemTime> for TruncatedTimestamp { |
|
130 | impl From<SystemTime> for TruncatedTimestamp { | |
131 | fn from(system_time: SystemTime) -> Self { |
|
131 | fn from(system_time: SystemTime) -> Self { | |
132 | // On Unix, `SystemTime` is a wrapper for the `timespec` C struct: |
|
132 | // On Unix, `SystemTime` is a wrapper for the `timespec` C struct: | |
133 | // https://www.gnu.org/software/libc/manual/html_node/Time-Types.html#index-struct-timespec |
|
133 | // https://www.gnu.org/software/libc/manual/html_node/Time-Types.html#index-struct-timespec | |
134 | // We want to effectively access its fields, but the Rust standard |
|
134 | // We want to effectively access its fields, but the Rust standard | |
135 | // library does not expose them. The best we can do is: |
|
135 | // library does not expose them. The best we can do is: | |
136 | let seconds; |
|
136 | let seconds; | |
137 | let nanoseconds; |
|
137 | let nanoseconds; | |
138 | match system_time.duration_since(UNIX_EPOCH) { |
|
138 | match system_time.duration_since(UNIX_EPOCH) { | |
139 | Ok(duration) => { |
|
139 | Ok(duration) => { | |
140 | seconds = duration.as_secs() as i64; |
|
140 | seconds = duration.as_secs() as i64; | |
141 | nanoseconds = duration.subsec_nanos(); |
|
141 | nanoseconds = duration.subsec_nanos(); | |
142 | } |
|
142 | } | |
143 | Err(error) => { |
|
143 | Err(error) => { | |
144 | // `system_time` is before `UNIX_EPOCH`. |
|
144 | // `system_time` is before `UNIX_EPOCH`. | |
145 | // We need to undo this algorithm: |
|
145 | // We need to undo this algorithm: | |
146 | // https://github.com/rust-lang/rust/blob/6bed1f0bc3cc50c10aab26d5f94b16a00776b8a5/library/std/src/sys/unix/time.rs#L40-L41 |
|
146 | // https://github.com/rust-lang/rust/blob/6bed1f0bc3cc50c10aab26d5f94b16a00776b8a5/library/std/src/sys/unix/time.rs#L40-L41 | |
147 | let negative = error.duration(); |
|
147 | let negative = error.duration(); | |
148 | let negative_secs = negative.as_secs() as i64; |
|
148 | let negative_secs = negative.as_secs() as i64; | |
149 | let negative_nanos = negative.subsec_nanos(); |
|
149 | let negative_nanos = negative.subsec_nanos(); | |
150 | if negative_nanos == 0 { |
|
150 | if negative_nanos == 0 { | |
151 | seconds = -negative_secs; |
|
151 | seconds = -negative_secs; | |
152 | nanoseconds = 0; |
|
152 | nanoseconds = 0; | |
153 | } else { |
|
153 | } else { | |
154 | // For example if `system_time` was 4.3 seconds before |
|
154 | // For example if `system_time` was 4.3 seconds before | |
155 | // the Unix epoch we get a Duration that represents |
|
155 | // the Unix epoch we get a Duration that represents | |
156 | // `(-4, -0.3)` but we want `(-5, +0.7)`: |
|
156 | // `(-4, -0.3)` but we want `(-5, +0.7)`: | |
157 | seconds = -1 - negative_secs; |
|
157 | seconds = -1 - negative_secs; | |
158 | nanoseconds = NSEC_PER_SEC - negative_nanos; |
|
158 | nanoseconds = NSEC_PER_SEC - negative_nanos; | |
159 | } |
|
159 | } | |
160 | } |
|
160 | } | |
161 | }; |
|
161 | }; | |
162 | Self::new_truncate(seconds, nanoseconds) |
|
162 | Self::new_truncate(seconds, nanoseconds) | |
163 | } |
|
163 | } | |
164 | } |
|
164 | } | |
165 |
|
165 | |||
166 | const NSEC_PER_SEC: u32 = 1_000_000_000; |
|
166 | const NSEC_PER_SEC: u32 = 1_000_000_000; | |
167 | const RANGE_MASK_31BIT: u32 = 0x7FFF_FFFF; |
|
167 | const RANGE_MASK_31BIT: u32 = 0x7FFF_FFFF; | |
168 |
|
168 | |||
169 | pub const MTIME_UNSET: i32 = -1; |
|
169 | pub const MTIME_UNSET: i32 = -1; | |
170 |
|
170 | |||
171 | /// A `DirstateEntry` with a size of `-2` means that it was merged from the |
|
171 | /// A `DirstateEntry` with a size of `-2` means that it was merged from the | |
172 | /// other parent. This allows revert to pick the right status back during a |
|
172 | /// other parent. This allows revert to pick the right status back during a | |
173 | /// merge. |
|
173 | /// merge. | |
174 | pub const SIZE_FROM_OTHER_PARENT: i32 = -2; |
|
174 | pub const SIZE_FROM_OTHER_PARENT: i32 = -2; | |
175 | /// A special value used for internal representation of special case in |
|
175 | /// A special value used for internal representation of special case in | |
176 | /// dirstate v1 format. |
|
176 | /// dirstate v1 format. | |
177 | pub const SIZE_NON_NORMAL: i32 = -1; |
|
177 | pub const SIZE_NON_NORMAL: i32 = -1; | |
178 |
|
178 | |||
179 | impl DirstateEntry { |
|
179 | impl DirstateEntry { | |
180 | pub fn from_v2_data( |
|
180 | pub fn from_v2_data( | |
181 | wdir_tracked: bool, |
|
181 | wdir_tracked: bool, | |
182 | p1_tracked: bool, |
|
182 | p1_tracked: bool, | |
183 | p2_info: bool, |
|
183 | p2_info: bool, | |
184 | mode_size: Option<(u32, u32)>, |
|
184 | mode_size: Option<(u32, u32)>, | |
185 | mtime: Option<u32>, |
|
185 | mtime: Option<u32>, | |
186 | fallback_exec: Option<bool>, |
|
186 | fallback_exec: Option<bool>, | |
187 | fallback_symlink: Option<bool>, |
|
187 | fallback_symlink: Option<bool>, | |
188 | ) -> Self { |
|
188 | ) -> Self { | |
189 | if let Some((mode, size)) = mode_size { |
|
189 | if let Some((mode, size)) = mode_size { | |
190 | // TODO: return an error for out of range values? |
|
190 | // TODO: return an error for out of range values? | |
191 | assert!(mode & !RANGE_MASK_31BIT == 0); |
|
191 | assert!(mode & !RANGE_MASK_31BIT == 0); | |
192 | assert!(size & !RANGE_MASK_31BIT == 0); |
|
192 | assert!(size & !RANGE_MASK_31BIT == 0); | |
193 | } |
|
193 | } | |
194 | if let Some(mtime) = mtime { |
|
194 | if let Some(mtime) = mtime { | |
195 | assert!(mtime & !RANGE_MASK_31BIT == 0); |
|
195 | assert!(mtime & !RANGE_MASK_31BIT == 0); | |
196 | } |
|
196 | } | |
197 | let mut flags = Flags::empty(); |
|
197 | let mut flags = Flags::empty(); | |
198 | flags.set(Flags::WDIR_TRACKED, wdir_tracked); |
|
198 | flags.set(Flags::WDIR_TRACKED, wdir_tracked); | |
199 | flags.set(Flags::P1_TRACKED, p1_tracked); |
|
199 | flags.set(Flags::P1_TRACKED, p1_tracked); | |
200 | flags.set(Flags::P2_INFO, p2_info); |
|
200 | flags.set(Flags::P2_INFO, p2_info); | |
201 | if let Some(exec) = fallback_exec { |
|
201 | if let Some(exec) = fallback_exec { | |
202 | flags.insert(Flags::HAS_FALLBACK_EXEC); |
|
202 | flags.insert(Flags::HAS_FALLBACK_EXEC); | |
203 | if exec { |
|
203 | if exec { | |
204 | flags.insert(Flags::FALLBACK_EXEC); |
|
204 | flags.insert(Flags::FALLBACK_EXEC); | |
205 | } |
|
205 | } | |
206 | } |
|
206 | } | |
207 | if let Some(exec) = fallback_symlink { |
|
207 | if let Some(exec) = fallback_symlink { | |
208 | flags.insert(Flags::HAS_FALLBACK_SYMLINK); |
|
208 | flags.insert(Flags::HAS_FALLBACK_SYMLINK); | |
209 | if exec { |
|
209 | if exec { | |
210 | flags.insert(Flags::FALLBACK_SYMLINK); |
|
210 | flags.insert(Flags::FALLBACK_SYMLINK); | |
211 | } |
|
211 | } | |
212 | } |
|
212 | } | |
213 | Self { |
|
213 | Self { | |
214 | flags, |
|
214 | flags, | |
215 | mode_size, |
|
215 | mode_size, | |
216 | mtime, |
|
216 | mtime, | |
217 | } |
|
217 | } | |
218 | } |
|
218 | } | |
219 |
|
219 | |||
220 | pub fn from_v1_data( |
|
220 | pub fn from_v1_data( | |
221 | state: EntryState, |
|
221 | state: EntryState, | |
222 | mode: i32, |
|
222 | mode: i32, | |
223 | size: i32, |
|
223 | size: i32, | |
224 | mtime: i32, |
|
224 | mtime: i32, | |
225 | ) -> Self { |
|
225 | ) -> Self { | |
226 | match state { |
|
226 | match state { | |
227 | EntryState::Normal => { |
|
227 | EntryState::Normal => { | |
228 | if size == SIZE_FROM_OTHER_PARENT { |
|
228 | if size == SIZE_FROM_OTHER_PARENT { | |
229 | Self { |
|
229 | Self { | |
230 | // might be missing P1_TRACKED |
|
230 | // might be missing P1_TRACKED | |
231 | flags: Flags::WDIR_TRACKED | Flags::P2_INFO, |
|
231 | flags: Flags::WDIR_TRACKED | Flags::P2_INFO, | |
232 | mode_size: None, |
|
232 | mode_size: None, | |
233 | mtime: None, |
|
233 | mtime: None, | |
234 | } |
|
234 | } | |
235 | } else if size == SIZE_NON_NORMAL { |
|
235 | } else if size == SIZE_NON_NORMAL { | |
236 | Self { |
|
236 | Self { | |
237 | flags: Flags::WDIR_TRACKED | Flags::P1_TRACKED, |
|
237 | flags: Flags::WDIR_TRACKED | Flags::P1_TRACKED, | |
238 | mode_size: None, |
|
238 | mode_size: None, | |
239 | mtime: None, |
|
239 | mtime: None, | |
240 | } |
|
240 | } | |
241 | } else if mtime == MTIME_UNSET { |
|
241 | } else if mtime == MTIME_UNSET { | |
242 | // TODO: return an error for negative values? |
|
242 | // TODO: return an error for negative values? | |
243 | let mode = u32::try_from(mode).unwrap(); |
|
243 | let mode = u32::try_from(mode).unwrap(); | |
244 | let size = u32::try_from(size).unwrap(); |
|
244 | let size = u32::try_from(size).unwrap(); | |
245 | Self { |
|
245 | Self { | |
246 | flags: Flags::WDIR_TRACKED | Flags::P1_TRACKED, |
|
246 | flags: Flags::WDIR_TRACKED | Flags::P1_TRACKED, | |
247 | mode_size: Some((mode, size)), |
|
247 | mode_size: Some((mode, size)), | |
248 | mtime: None, |
|
248 | mtime: None, | |
249 | } |
|
249 | } | |
250 | } else { |
|
250 | } else { | |
251 | // TODO: return an error for negative values? |
|
251 | // TODO: return an error for negative values? | |
252 | let mode = u32::try_from(mode).unwrap(); |
|
252 | let mode = u32::try_from(mode).unwrap(); | |
253 | let size = u32::try_from(size).unwrap(); |
|
253 | let size = u32::try_from(size).unwrap(); | |
254 | let mtime = u32::try_from(mtime).unwrap(); |
|
254 | let mtime = u32::try_from(mtime).unwrap(); | |
255 | Self { |
|
255 | Self { | |
256 | flags: Flags::WDIR_TRACKED | Flags::P1_TRACKED, |
|
256 | flags: Flags::WDIR_TRACKED | Flags::P1_TRACKED, | |
257 | mode_size: Some((mode, size)), |
|
257 | mode_size: Some((mode, size)), | |
258 | mtime: Some(mtime), |
|
258 | mtime: Some(mtime), | |
259 | } |
|
259 | } | |
260 | } |
|
260 | } | |
261 | } |
|
261 | } | |
262 | EntryState::Added => Self { |
|
262 | EntryState::Added => Self { | |
263 | flags: Flags::WDIR_TRACKED, |
|
263 | flags: Flags::WDIR_TRACKED, | |
264 | mode_size: None, |
|
264 | mode_size: None, | |
265 | mtime: None, |
|
265 | mtime: None, | |
266 | }, |
|
266 | }, | |
267 | EntryState::Removed => Self { |
|
267 | EntryState::Removed => Self { | |
268 | flags: if size == SIZE_NON_NORMAL { |
|
268 | flags: if size == SIZE_NON_NORMAL { | |
269 | Flags::P1_TRACKED | Flags::P2_INFO |
|
269 | Flags::P1_TRACKED | Flags::P2_INFO | |
270 | } else if size == SIZE_FROM_OTHER_PARENT { |
|
270 | } else if size == SIZE_FROM_OTHER_PARENT { | |
271 | // We don’t know if P1_TRACKED should be set (file history) |
|
271 | // We don’t know if P1_TRACKED should be set (file history) | |
272 | Flags::P2_INFO |
|
272 | Flags::P2_INFO | |
273 | } else { |
|
273 | } else { | |
274 | Flags::P1_TRACKED |
|
274 | Flags::P1_TRACKED | |
275 | }, |
|
275 | }, | |
276 | mode_size: None, |
|
276 | mode_size: None, | |
277 | mtime: None, |
|
277 | mtime: None, | |
278 | }, |
|
278 | }, | |
279 | EntryState::Merged => Self { |
|
279 | EntryState::Merged => Self { | |
280 | flags: Flags::WDIR_TRACKED |
|
280 | flags: Flags::WDIR_TRACKED | |
281 | | Flags::P1_TRACKED // might not be true because of rename ? |
|
281 | | Flags::P1_TRACKED // might not be true because of rename ? | |
282 | | Flags::P2_INFO, // might not be true because of rename ? |
|
282 | | Flags::P2_INFO, // might not be true because of rename ? | |
283 | mode_size: None, |
|
283 | mode_size: None, | |
284 | mtime: None, |
|
284 | mtime: None, | |
285 | }, |
|
285 | }, | |
286 | } |
|
286 | } | |
287 | } |
|
287 | } | |
288 |
|
288 | |||
289 | /// Creates a new entry in "removed" state. |
|
289 | /// Creates a new entry in "removed" state. | |
290 | /// |
|
290 | /// | |
291 | /// `size` is expected to be zero, `SIZE_NON_NORMAL`, or |
|
291 | /// `size` is expected to be zero, `SIZE_NON_NORMAL`, or | |
292 | /// `SIZE_FROM_OTHER_PARENT` |
|
292 | /// `SIZE_FROM_OTHER_PARENT` | |
293 | pub fn new_removed(size: i32) -> Self { |
|
293 | pub fn new_removed(size: i32) -> Self { | |
294 | Self::from_v1_data(EntryState::Removed, 0, size, 0) |
|
294 | Self::from_v1_data(EntryState::Removed, 0, size, 0) | |
295 | } |
|
295 | } | |
296 |
|
296 | |||
297 | pub fn tracked(&self) -> bool { |
|
297 | pub fn tracked(&self) -> bool { | |
298 | self.flags.contains(Flags::WDIR_TRACKED) |
|
298 | self.flags.contains(Flags::WDIR_TRACKED) | |
299 | } |
|
299 | } | |
300 |
|
300 | |||
301 | pub fn p1_tracked(&self) -> bool { |
|
301 | pub fn p1_tracked(&self) -> bool { | |
302 | self.flags.contains(Flags::P1_TRACKED) |
|
302 | self.flags.contains(Flags::P1_TRACKED) | |
303 | } |
|
303 | } | |
304 |
|
304 | |||
305 | fn in_either_parent(&self) -> bool { |
|
305 | fn in_either_parent(&self) -> bool { | |
306 | self.flags.intersects(Flags::P1_TRACKED | Flags::P2_INFO) |
|
306 | self.flags.intersects(Flags::P1_TRACKED | Flags::P2_INFO) | |
307 | } |
|
307 | } | |
308 |
|
308 | |||
309 | pub fn removed(&self) -> bool { |
|
309 | pub fn removed(&self) -> bool { | |
310 | self.in_either_parent() && !self.flags.contains(Flags::WDIR_TRACKED) |
|
310 | self.in_either_parent() && !self.flags.contains(Flags::WDIR_TRACKED) | |
311 | } |
|
311 | } | |
312 |
|
312 | |||
313 | pub fn p2_info(&self) -> bool { |
|
313 | pub fn p2_info(&self) -> bool { | |
314 | self.flags.contains(Flags::WDIR_TRACKED | Flags::P2_INFO) |
|
314 | self.flags.contains(Flags::WDIR_TRACKED | Flags::P2_INFO) | |
315 | } |
|
315 | } | |
316 |
|
316 | |||
317 | pub fn added(&self) -> bool { |
|
317 | pub fn added(&self) -> bool { | |
318 | self.flags.contains(Flags::WDIR_TRACKED) && !self.in_either_parent() |
|
318 | self.flags.contains(Flags::WDIR_TRACKED) && !self.in_either_parent() | |
319 | } |
|
319 | } | |
320 |
|
320 | |||
321 | pub fn maybe_clean(&self) -> bool { |
|
321 | pub fn maybe_clean(&self) -> bool { | |
322 | if !self.flags.contains(Flags::WDIR_TRACKED) { |
|
322 | if !self.flags.contains(Flags::WDIR_TRACKED) { | |
323 | false |
|
323 | false | |
324 | } else if !self.flags.contains(Flags::P1_TRACKED) { |
|
324 | } else if !self.flags.contains(Flags::P1_TRACKED) { | |
325 | false |
|
325 | false | |
326 | } else if self.flags.contains(Flags::P2_INFO) { |
|
326 | } else if self.flags.contains(Flags::P2_INFO) { | |
327 | false |
|
327 | false | |
328 | } else { |
|
328 | } else { | |
329 | true |
|
329 | true | |
330 | } |
|
330 | } | |
331 | } |
|
331 | } | |
332 |
|
332 | |||
333 | pub fn any_tracked(&self) -> bool { |
|
333 | pub fn any_tracked(&self) -> bool { | |
334 | self.flags.intersects( |
|
334 | self.flags.intersects( | |
335 | Flags::WDIR_TRACKED | Flags::P1_TRACKED | Flags::P2_INFO, |
|
335 | Flags::WDIR_TRACKED | Flags::P1_TRACKED | Flags::P2_INFO, | |
336 | ) |
|
336 | ) | |
337 | } |
|
337 | } | |
338 |
|
338 | |||
339 | /// Returns `(wdir_tracked, p1_tracked, p2_info, mode_size, mtime)` |
|
339 | /// Returns `(wdir_tracked, p1_tracked, p2_info, mode_size, mtime)` | |
340 | pub(crate) fn v2_data( |
|
340 | pub(crate) fn v2_data( | |
341 | &self, |
|
341 | &self, | |
342 | ) -> (bool, bool, bool, Option<(u32, u32)>, Option<u32>) { |
|
342 | ) -> ( | |
|
343 | bool, | |||
|
344 | bool, | |||
|
345 | bool, | |||
|
346 | Option<(u32, u32)>, | |||
|
347 | Option<u32>, | |||
|
348 | Option<bool>, | |||
|
349 | Option<bool>, | |||
|
350 | ) { | |||
343 | if !self.any_tracked() { |
|
351 | if !self.any_tracked() { | |
344 | // TODO: return an Option instead? |
|
352 | // TODO: return an Option instead? | |
345 | panic!("Accessing v1_state of an untracked DirstateEntry") |
|
353 | panic!("Accessing v1_state of an untracked DirstateEntry") | |
346 | } |
|
354 | } | |
347 | let wdir_tracked = self.flags.contains(Flags::WDIR_TRACKED); |
|
355 | let wdir_tracked = self.flags.contains(Flags::WDIR_TRACKED); | |
348 | let p1_tracked = self.flags.contains(Flags::P1_TRACKED); |
|
356 | let p1_tracked = self.flags.contains(Flags::P1_TRACKED); | |
349 | let p2_info = self.flags.contains(Flags::P2_INFO); |
|
357 | let p2_info = self.flags.contains(Flags::P2_INFO); | |
350 | let mode_size = self.mode_size; |
|
358 | let mode_size = self.mode_size; | |
351 | let mtime = self.mtime; |
|
359 | let mtime = self.mtime; | |
352 | (wdir_tracked, p1_tracked, p2_info, mode_size, mtime) |
|
360 | ( | |
|
361 | wdir_tracked, | |||
|
362 | p1_tracked, | |||
|
363 | p2_info, | |||
|
364 | mode_size, | |||
|
365 | mtime, | |||
|
366 | self.get_fallback_exec(), | |||
|
367 | self.get_fallback_symlink(), | |||
|
368 | ) | |||
353 | } |
|
369 | } | |
354 |
|
370 | |||
355 | fn v1_state(&self) -> EntryState { |
|
371 | fn v1_state(&self) -> EntryState { | |
356 | if !self.any_tracked() { |
|
372 | if !self.any_tracked() { | |
357 | // TODO: return an Option instead? |
|
373 | // TODO: return an Option instead? | |
358 | panic!("Accessing v1_state of an untracked DirstateEntry") |
|
374 | panic!("Accessing v1_state of an untracked DirstateEntry") | |
359 | } |
|
375 | } | |
360 | if self.removed() { |
|
376 | if self.removed() { | |
361 | EntryState::Removed |
|
377 | EntryState::Removed | |
362 | } else if self |
|
378 | } else if self | |
363 | .flags |
|
379 | .flags | |
364 | .contains(Flags::WDIR_TRACKED | Flags::P1_TRACKED | Flags::P2_INFO) |
|
380 | .contains(Flags::WDIR_TRACKED | Flags::P1_TRACKED | Flags::P2_INFO) | |
365 | { |
|
381 | { | |
366 | EntryState::Merged |
|
382 | EntryState::Merged | |
367 | } else if self.added() { |
|
383 | } else if self.added() { | |
368 | EntryState::Added |
|
384 | EntryState::Added | |
369 | } else { |
|
385 | } else { | |
370 | EntryState::Normal |
|
386 | EntryState::Normal | |
371 | } |
|
387 | } | |
372 | } |
|
388 | } | |
373 |
|
389 | |||
374 | fn v1_mode(&self) -> i32 { |
|
390 | fn v1_mode(&self) -> i32 { | |
375 | if let Some((mode, _size)) = self.mode_size { |
|
391 | if let Some((mode, _size)) = self.mode_size { | |
376 | i32::try_from(mode).unwrap() |
|
392 | i32::try_from(mode).unwrap() | |
377 | } else { |
|
393 | } else { | |
378 | 0 |
|
394 | 0 | |
379 | } |
|
395 | } | |
380 | } |
|
396 | } | |
381 |
|
397 | |||
382 | fn v1_size(&self) -> i32 { |
|
398 | fn v1_size(&self) -> i32 { | |
383 | if !self.any_tracked() { |
|
399 | if !self.any_tracked() { | |
384 | // TODO: return an Option instead? |
|
400 | // TODO: return an Option instead? | |
385 | panic!("Accessing v1_size of an untracked DirstateEntry") |
|
401 | panic!("Accessing v1_size of an untracked DirstateEntry") | |
386 | } |
|
402 | } | |
387 | if self.removed() |
|
403 | if self.removed() | |
388 | && self.flags.contains(Flags::P1_TRACKED | Flags::P2_INFO) |
|
404 | && self.flags.contains(Flags::P1_TRACKED | Flags::P2_INFO) | |
389 | { |
|
405 | { | |
390 | SIZE_NON_NORMAL |
|
406 | SIZE_NON_NORMAL | |
391 | } else if self.flags.contains(Flags::P2_INFO) { |
|
407 | } else if self.flags.contains(Flags::P2_INFO) { | |
392 | SIZE_FROM_OTHER_PARENT |
|
408 | SIZE_FROM_OTHER_PARENT | |
393 | } else if self.removed() { |
|
409 | } else if self.removed() { | |
394 | 0 |
|
410 | 0 | |
395 | } else if self.added() { |
|
411 | } else if self.added() { | |
396 | SIZE_NON_NORMAL |
|
412 | SIZE_NON_NORMAL | |
397 | } else if let Some((_mode, size)) = self.mode_size { |
|
413 | } else if let Some((_mode, size)) = self.mode_size { | |
398 | i32::try_from(size).unwrap() |
|
414 | i32::try_from(size).unwrap() | |
399 | } else { |
|
415 | } else { | |
400 | SIZE_NON_NORMAL |
|
416 | SIZE_NON_NORMAL | |
401 | } |
|
417 | } | |
402 | } |
|
418 | } | |
403 |
|
419 | |||
404 | fn v1_mtime(&self) -> i32 { |
|
420 | fn v1_mtime(&self) -> i32 { | |
405 | if !self.any_tracked() { |
|
421 | if !self.any_tracked() { | |
406 | // TODO: return an Option instead? |
|
422 | // TODO: return an Option instead? | |
407 | panic!("Accessing v1_mtime of an untracked DirstateEntry") |
|
423 | panic!("Accessing v1_mtime of an untracked DirstateEntry") | |
408 | } |
|
424 | } | |
409 | if self.removed() { |
|
425 | if self.removed() { | |
410 | 0 |
|
426 | 0 | |
411 | } else if self.flags.contains(Flags::P2_INFO) { |
|
427 | } else if self.flags.contains(Flags::P2_INFO) { | |
412 | MTIME_UNSET |
|
428 | MTIME_UNSET | |
413 | } else if !self.flags.contains(Flags::P1_TRACKED) { |
|
429 | } else if !self.flags.contains(Flags::P1_TRACKED) { | |
414 | MTIME_UNSET |
|
430 | MTIME_UNSET | |
415 | } else if let Some(mtime) = self.mtime { |
|
431 | } else if let Some(mtime) = self.mtime { | |
416 | i32::try_from(mtime).unwrap() |
|
432 | i32::try_from(mtime).unwrap() | |
417 | } else { |
|
433 | } else { | |
418 | MTIME_UNSET |
|
434 | MTIME_UNSET | |
419 | } |
|
435 | } | |
420 | } |
|
436 | } | |
421 |
|
437 | |||
422 | // TODO: return `Option<EntryState>`? None when `!self.any_tracked` |
|
438 | // TODO: return `Option<EntryState>`? None when `!self.any_tracked` | |
423 | pub fn state(&self) -> EntryState { |
|
439 | pub fn state(&self) -> EntryState { | |
424 | self.v1_state() |
|
440 | self.v1_state() | |
425 | } |
|
441 | } | |
426 |
|
442 | |||
427 | // TODO: return Option? |
|
443 | // TODO: return Option? | |
428 | pub fn mode(&self) -> i32 { |
|
444 | pub fn mode(&self) -> i32 { | |
429 | self.v1_mode() |
|
445 | self.v1_mode() | |
430 | } |
|
446 | } | |
431 |
|
447 | |||
432 | // TODO: return Option? |
|
448 | // TODO: return Option? | |
433 | pub fn size(&self) -> i32 { |
|
449 | pub fn size(&self) -> i32 { | |
434 | self.v1_size() |
|
450 | self.v1_size() | |
435 | } |
|
451 | } | |
436 |
|
452 | |||
437 | // TODO: return Option? |
|
453 | // TODO: return Option? | |
438 | pub fn mtime(&self) -> i32 { |
|
454 | pub fn mtime(&self) -> i32 { | |
439 | self.v1_mtime() |
|
455 | self.v1_mtime() | |
440 | } |
|
456 | } | |
441 |
|
457 | |||
442 | pub fn get_fallback_exec(&self) -> Option<bool> { |
|
458 | pub fn get_fallback_exec(&self) -> Option<bool> { | |
443 | if self.flags.contains(Flags::HAS_FALLBACK_EXEC) { |
|
459 | if self.flags.contains(Flags::HAS_FALLBACK_EXEC) { | |
444 | Some(self.flags.contains(Flags::FALLBACK_EXEC)) |
|
460 | Some(self.flags.contains(Flags::FALLBACK_EXEC)) | |
445 | } else { |
|
461 | } else { | |
446 | None |
|
462 | None | |
447 | } |
|
463 | } | |
448 | } |
|
464 | } | |
449 |
|
465 | |||
450 | pub fn set_fallback_exec(&mut self, value: Option<bool>) { |
|
466 | pub fn set_fallback_exec(&mut self, value: Option<bool>) { | |
451 | match value { |
|
467 | match value { | |
452 | None => { |
|
468 | None => { | |
453 | self.flags.remove(Flags::HAS_FALLBACK_EXEC); |
|
469 | self.flags.remove(Flags::HAS_FALLBACK_EXEC); | |
454 | self.flags.remove(Flags::FALLBACK_EXEC); |
|
470 | self.flags.remove(Flags::FALLBACK_EXEC); | |
455 | } |
|
471 | } | |
456 | Some(exec) => { |
|
472 | Some(exec) => { | |
457 | self.flags.insert(Flags::HAS_FALLBACK_EXEC); |
|
473 | self.flags.insert(Flags::HAS_FALLBACK_EXEC); | |
458 | if exec { |
|
474 | if exec { | |
459 | self.flags.insert(Flags::FALLBACK_EXEC); |
|
475 | self.flags.insert(Flags::FALLBACK_EXEC); | |
460 | } |
|
476 | } | |
461 | } |
|
477 | } | |
462 | } |
|
478 | } | |
463 | } |
|
479 | } | |
464 |
|
480 | |||
465 | pub fn get_fallback_symlink(&self) -> Option<bool> { |
|
481 | pub fn get_fallback_symlink(&self) -> Option<bool> { | |
466 | if self.flags.contains(Flags::HAS_FALLBACK_SYMLINK) { |
|
482 | if self.flags.contains(Flags::HAS_FALLBACK_SYMLINK) { | |
467 | Some(self.flags.contains(Flags::FALLBACK_SYMLINK)) |
|
483 | Some(self.flags.contains(Flags::FALLBACK_SYMLINK)) | |
468 | } else { |
|
484 | } else { | |
469 | None |
|
485 | None | |
470 | } |
|
486 | } | |
471 | } |
|
487 | } | |
472 |
|
488 | |||
473 | pub fn set_fallback_symlink(&mut self, value: Option<bool>) { |
|
489 | pub fn set_fallback_symlink(&mut self, value: Option<bool>) { | |
474 | match value { |
|
490 | match value { | |
475 | None => { |
|
491 | None => { | |
476 | self.flags.remove(Flags::HAS_FALLBACK_SYMLINK); |
|
492 | self.flags.remove(Flags::HAS_FALLBACK_SYMLINK); | |
477 | self.flags.remove(Flags::FALLBACK_SYMLINK); |
|
493 | self.flags.remove(Flags::FALLBACK_SYMLINK); | |
478 | } |
|
494 | } | |
479 | Some(symlink) => { |
|
495 | Some(symlink) => { | |
480 | self.flags.insert(Flags::HAS_FALLBACK_SYMLINK); |
|
496 | self.flags.insert(Flags::HAS_FALLBACK_SYMLINK); | |
481 | if symlink { |
|
497 | if symlink { | |
482 | self.flags.insert(Flags::FALLBACK_SYMLINK); |
|
498 | self.flags.insert(Flags::FALLBACK_SYMLINK); | |
483 | } |
|
499 | } | |
484 | } |
|
500 | } | |
485 | } |
|
501 | } | |
486 | } |
|
502 | } | |
487 |
|
503 | |||
488 | pub fn drop_merge_data(&mut self) { |
|
504 | pub fn drop_merge_data(&mut self) { | |
489 | if self.flags.contains(Flags::P2_INFO) { |
|
505 | if self.flags.contains(Flags::P2_INFO) { | |
490 | self.flags.remove(Flags::P2_INFO); |
|
506 | self.flags.remove(Flags::P2_INFO); | |
491 | self.mode_size = None; |
|
507 | self.mode_size = None; | |
492 | self.mtime = None; |
|
508 | self.mtime = None; | |
493 | } |
|
509 | } | |
494 | } |
|
510 | } | |
495 |
|
511 | |||
496 | pub fn set_possibly_dirty(&mut self) { |
|
512 | pub fn set_possibly_dirty(&mut self) { | |
497 | self.mtime = None |
|
513 | self.mtime = None | |
498 | } |
|
514 | } | |
499 |
|
515 | |||
500 | pub fn set_clean(&mut self, mode: u32, size: u32, mtime: u32) { |
|
516 | pub fn set_clean(&mut self, mode: u32, size: u32, mtime: u32) { | |
501 | let size = size & RANGE_MASK_31BIT; |
|
517 | let size = size & RANGE_MASK_31BIT; | |
502 | let mtime = mtime & RANGE_MASK_31BIT; |
|
518 | let mtime = mtime & RANGE_MASK_31BIT; | |
503 | self.flags.insert(Flags::WDIR_TRACKED | Flags::P1_TRACKED); |
|
519 | self.flags.insert(Flags::WDIR_TRACKED | Flags::P1_TRACKED); | |
504 | self.mode_size = Some((mode, size)); |
|
520 | self.mode_size = Some((mode, size)); | |
505 | self.mtime = Some(mtime); |
|
521 | self.mtime = Some(mtime); | |
506 | } |
|
522 | } | |
507 |
|
523 | |||
508 | pub fn set_tracked(&mut self) { |
|
524 | pub fn set_tracked(&mut self) { | |
509 | self.flags.insert(Flags::WDIR_TRACKED); |
|
525 | self.flags.insert(Flags::WDIR_TRACKED); | |
510 | // `set_tracked` is replacing various `normallookup` calls. So we mark |
|
526 | // `set_tracked` is replacing various `normallookup` calls. So we mark | |
511 | // the files as needing lookup |
|
527 | // the files as needing lookup | |
512 | // |
|
528 | // | |
513 | // Consider dropping this in the future in favor of something less |
|
529 | // Consider dropping this in the future in favor of something less | |
514 | // broad. |
|
530 | // broad. | |
515 | self.mtime = None; |
|
531 | self.mtime = None; | |
516 | } |
|
532 | } | |
517 |
|
533 | |||
518 | pub fn set_untracked(&mut self) { |
|
534 | pub fn set_untracked(&mut self) { | |
519 | self.flags.remove(Flags::WDIR_TRACKED); |
|
535 | self.flags.remove(Flags::WDIR_TRACKED); | |
520 | self.mode_size = None; |
|
536 | self.mode_size = None; | |
521 | self.mtime = None; |
|
537 | self.mtime = None; | |
522 | } |
|
538 | } | |
523 |
|
539 | |||
524 | /// Returns `(state, mode, size, mtime)` for the purpose of serialization |
|
540 | /// Returns `(state, mode, size, mtime)` for the purpose of serialization | |
525 | /// in the dirstate-v1 format. |
|
541 | /// in the dirstate-v1 format. | |
526 | /// |
|
542 | /// | |
527 | /// This includes marker values such as `mtime == -1`. In the future we may |
|
543 | /// This includes marker values such as `mtime == -1`. In the future we may | |
528 | /// want to not represent these cases that way in memory, but serialization |
|
544 | /// want to not represent these cases that way in memory, but serialization | |
529 | /// will need to keep the same format. |
|
545 | /// will need to keep the same format. | |
530 | pub fn v1_data(&self) -> (u8, i32, i32, i32) { |
|
546 | pub fn v1_data(&self) -> (u8, i32, i32, i32) { | |
531 | ( |
|
547 | ( | |
532 | self.v1_state().into(), |
|
548 | self.v1_state().into(), | |
533 | self.v1_mode(), |
|
549 | self.v1_mode(), | |
534 | self.v1_size(), |
|
550 | self.v1_size(), | |
535 | self.v1_mtime(), |
|
551 | self.v1_mtime(), | |
536 | ) |
|
552 | ) | |
537 | } |
|
553 | } | |
538 |
|
554 | |||
539 | pub(crate) fn is_from_other_parent(&self) -> bool { |
|
555 | pub(crate) fn is_from_other_parent(&self) -> bool { | |
540 | self.state() == EntryState::Normal |
|
556 | self.state() == EntryState::Normal | |
541 | && self.size() == SIZE_FROM_OTHER_PARENT |
|
557 | && self.size() == SIZE_FROM_OTHER_PARENT | |
542 | } |
|
558 | } | |
543 |
|
559 | |||
544 | // TODO: other platforms |
|
560 | // TODO: other platforms | |
545 | #[cfg(unix)] |
|
561 | #[cfg(unix)] | |
546 | pub fn mode_changed( |
|
562 | pub fn mode_changed( | |
547 | &self, |
|
563 | &self, | |
548 | filesystem_metadata: &std::fs::Metadata, |
|
564 | filesystem_metadata: &std::fs::Metadata, | |
549 | ) -> bool { |
|
565 | ) -> bool { | |
550 | use std::os::unix::fs::MetadataExt; |
|
566 | use std::os::unix::fs::MetadataExt; | |
551 | const EXEC_BIT_MASK: u32 = 0o100; |
|
567 | const EXEC_BIT_MASK: u32 = 0o100; | |
552 | let dirstate_exec_bit = (self.mode() as u32) & EXEC_BIT_MASK; |
|
568 | let dirstate_exec_bit = (self.mode() as u32) & EXEC_BIT_MASK; | |
553 | let fs_exec_bit = filesystem_metadata.mode() & EXEC_BIT_MASK; |
|
569 | let fs_exec_bit = filesystem_metadata.mode() & EXEC_BIT_MASK; | |
554 | dirstate_exec_bit != fs_exec_bit |
|
570 | dirstate_exec_bit != fs_exec_bit | |
555 | } |
|
571 | } | |
556 |
|
572 | |||
557 | /// Returns a `(state, mode, size, mtime)` tuple as for |
|
573 | /// Returns a `(state, mode, size, mtime)` tuple as for | |
558 | /// `DirstateMapMethods::debug_iter`. |
|
574 | /// `DirstateMapMethods::debug_iter`. | |
559 | pub fn debug_tuple(&self) -> (u8, i32, i32, i32) { |
|
575 | pub fn debug_tuple(&self) -> (u8, i32, i32, i32) { | |
560 | (self.state().into(), self.mode(), self.size(), self.mtime()) |
|
576 | (self.state().into(), self.mode(), self.size(), self.mtime()) | |
561 | } |
|
577 | } | |
562 |
|
578 | |||
563 | pub fn mtime_is_ambiguous(&self, now: i32) -> bool { |
|
579 | pub fn mtime_is_ambiguous(&self, now: i32) -> bool { | |
564 | self.state() == EntryState::Normal && self.mtime() == now |
|
580 | self.state() == EntryState::Normal && self.mtime() == now | |
565 | } |
|
581 | } | |
566 |
|
582 | |||
567 | pub fn clear_ambiguous_mtime(&mut self, now: i32) -> bool { |
|
583 | pub fn clear_ambiguous_mtime(&mut self, now: i32) -> bool { | |
568 | let ambiguous = self.mtime_is_ambiguous(now); |
|
584 | let ambiguous = self.mtime_is_ambiguous(now); | |
569 | if ambiguous { |
|
585 | if ambiguous { | |
570 | // The file was last modified "simultaneously" with the current |
|
586 | // The file was last modified "simultaneously" with the current | |
571 | // write to dirstate (i.e. within the same second for file- |
|
587 | // write to dirstate (i.e. within the same second for file- | |
572 | // systems with a granularity of 1 sec). This commonly happens |
|
588 | // systems with a granularity of 1 sec). This commonly happens | |
573 | // for at least a couple of files on 'update'. |
|
589 | // for at least a couple of files on 'update'. | |
574 | // The user could change the file without changing its size |
|
590 | // The user could change the file without changing its size | |
575 | // within the same second. Invalidate the file's mtime in |
|
591 | // within the same second. Invalidate the file's mtime in | |
576 | // dirstate, forcing future 'status' calls to compare the |
|
592 | // dirstate, forcing future 'status' calls to compare the | |
577 | // contents of the file if the size is the same. This prevents |
|
593 | // contents of the file if the size is the same. This prevents | |
578 | // mistakenly treating such files as clean. |
|
594 | // mistakenly treating such files as clean. | |
579 | self.set_possibly_dirty() |
|
595 | self.set_possibly_dirty() | |
580 | } |
|
596 | } | |
581 | ambiguous |
|
597 | ambiguous | |
582 | } |
|
598 | } | |
583 | } |
|
599 | } | |
584 |
|
600 | |||
585 | impl EntryState { |
|
601 | impl EntryState { | |
586 | pub fn is_tracked(self) -> bool { |
|
602 | pub fn is_tracked(self) -> bool { | |
587 | use EntryState::*; |
|
603 | use EntryState::*; | |
588 | match self { |
|
604 | match self { | |
589 | Normal | Added | Merged => true, |
|
605 | Normal | Added | Merged => true, | |
590 | Removed => false, |
|
606 | Removed => false, | |
591 | } |
|
607 | } | |
592 | } |
|
608 | } | |
593 | } |
|
609 | } | |
594 |
|
610 | |||
595 | impl TryFrom<u8> for EntryState { |
|
611 | impl TryFrom<u8> for EntryState { | |
596 | type Error = HgError; |
|
612 | type Error = HgError; | |
597 |
|
613 | |||
598 | fn try_from(value: u8) -> Result<Self, Self::Error> { |
|
614 | fn try_from(value: u8) -> Result<Self, Self::Error> { | |
599 | match value { |
|
615 | match value { | |
600 | b'n' => Ok(EntryState::Normal), |
|
616 | b'n' => Ok(EntryState::Normal), | |
601 | b'a' => Ok(EntryState::Added), |
|
617 | b'a' => Ok(EntryState::Added), | |
602 | b'r' => Ok(EntryState::Removed), |
|
618 | b'r' => Ok(EntryState::Removed), | |
603 | b'm' => Ok(EntryState::Merged), |
|
619 | b'm' => Ok(EntryState::Merged), | |
604 | _ => Err(HgError::CorruptedRepository(format!( |
|
620 | _ => Err(HgError::CorruptedRepository(format!( | |
605 | "Incorrect dirstate entry state {}", |
|
621 | "Incorrect dirstate entry state {}", | |
606 | value |
|
622 | value | |
607 | ))), |
|
623 | ))), | |
608 | } |
|
624 | } | |
609 | } |
|
625 | } | |
610 | } |
|
626 | } | |
611 |
|
627 | |||
612 | impl Into<u8> for EntryState { |
|
628 | impl Into<u8> for EntryState { | |
613 | fn into(self) -> u8 { |
|
629 | fn into(self) -> u8 { | |
614 | match self { |
|
630 | match self { | |
615 | EntryState::Normal => b'n', |
|
631 | EntryState::Normal => b'n', | |
616 | EntryState::Added => b'a', |
|
632 | EntryState::Added => b'a', | |
617 | EntryState::Removed => b'r', |
|
633 | EntryState::Removed => b'r', | |
618 | EntryState::Merged => b'm', |
|
634 | EntryState::Merged => b'm', | |
619 | } |
|
635 | } | |
620 | } |
|
636 | } | |
621 | } |
|
637 | } |
@@ -1,750 +1,773 b'' | |||||
1 | //! The "version 2" disk representation of the dirstate |
|
1 | //! The "version 2" disk representation of the dirstate | |
2 | //! |
|
2 | //! | |
3 | //! See `mercurial/helptext/internals/dirstate-v2.txt` |
|
3 | //! See `mercurial/helptext/internals/dirstate-v2.txt` | |
4 |
|
4 | |||
5 | use crate::dirstate::TruncatedTimestamp; |
|
5 | use crate::dirstate::TruncatedTimestamp; | |
6 | use crate::dirstate_tree::dirstate_map::{self, DirstateMap, NodeRef}; |
|
6 | use crate::dirstate_tree::dirstate_map::{self, DirstateMap, NodeRef}; | |
7 | use crate::dirstate_tree::path_with_basename::WithBasename; |
|
7 | use crate::dirstate_tree::path_with_basename::WithBasename; | |
8 | use crate::errors::HgError; |
|
8 | use crate::errors::HgError; | |
9 | use crate::utils::hg_path::HgPath; |
|
9 | use crate::utils::hg_path::HgPath; | |
10 | use crate::DirstateEntry; |
|
10 | use crate::DirstateEntry; | |
11 | use crate::DirstateError; |
|
11 | use crate::DirstateError; | |
12 | use crate::DirstateParents; |
|
12 | use crate::DirstateParents; | |
13 | use bitflags::bitflags; |
|
13 | use bitflags::bitflags; | |
14 | use bytes_cast::unaligned::{U16Be, U32Be}; |
|
14 | use bytes_cast::unaligned::{U16Be, U32Be}; | |
15 | use bytes_cast::BytesCast; |
|
15 | use bytes_cast::BytesCast; | |
16 | use format_bytes::format_bytes; |
|
16 | use format_bytes::format_bytes; | |
17 | use std::borrow::Cow; |
|
17 | use std::borrow::Cow; | |
18 | use std::convert::{TryFrom, TryInto}; |
|
18 | use std::convert::{TryFrom, TryInto}; | |
19 |
|
19 | |||
20 | /// Added at the start of `.hg/dirstate` when the "v2" format is used. |
|
20 | /// Added at the start of `.hg/dirstate` when the "v2" format is used. | |
21 | /// This is a redundant sanity check more than an actual "magic number" since |

21 | /// This is a redundant sanity check more than an actual "magic number" since | |
22 | /// `.hg/requires` already governs which format should be used. |
|
22 | /// `.hg/requires` already governs which format should be used. | |
23 | pub const V2_FORMAT_MARKER: &[u8; 12] = b"dirstate-v2\n"; |
|
23 | pub const V2_FORMAT_MARKER: &[u8; 12] = b"dirstate-v2\n"; | |
24 |
|
24 | |||
25 | /// Keep space for 256-bit hashes |
|
25 | /// Keep space for 256-bit hashes | |
26 | const STORED_NODE_ID_BYTES: usize = 32; |
|
26 | const STORED_NODE_ID_BYTES: usize = 32; | |
27 |
|
27 | |||
28 | /// … even though only 160 bits are used for now, with SHA-1 |

28 | /// … even though only 160 bits are used for now, with SHA-1 | |
29 | const USED_NODE_ID_BYTES: usize = 20; |
|
29 | const USED_NODE_ID_BYTES: usize = 20; | |
30 |
|
30 | |||
31 | pub(super) const IGNORE_PATTERNS_HASH_LEN: usize = 20; |
|
31 | pub(super) const IGNORE_PATTERNS_HASH_LEN: usize = 20; | |
32 | pub(super) type IgnorePatternsHash = [u8; IGNORE_PATTERNS_HASH_LEN]; |
|
32 | pub(super) type IgnorePatternsHash = [u8; IGNORE_PATTERNS_HASH_LEN]; | |
33 |
|
33 | |||
34 | /// Must match constants of the same names in `mercurial/dirstateutils/v2.py` |
|
34 | /// Must match constants of the same names in `mercurial/dirstateutils/v2.py` | |
35 | const TREE_METADATA_SIZE: usize = 44; |
|
35 | const TREE_METADATA_SIZE: usize = 44; | |
36 | const NODE_SIZE: usize = 44; |
|
36 | const NODE_SIZE: usize = 44; | |
37 |
|
37 | |||
38 | /// Make sure that size-affecting changes are made knowingly |
|
38 | /// Make sure that size-affecting changes are made knowingly | |
39 | #[allow(unused)] |
|
39 | #[allow(unused)] | |
40 | fn static_assert_size_of() { |
|
40 | fn static_assert_size_of() { | |
41 | let _ = std::mem::transmute::<TreeMetadata, [u8; TREE_METADATA_SIZE]>; |
|
41 | let _ = std::mem::transmute::<TreeMetadata, [u8; TREE_METADATA_SIZE]>; | |
42 | let _ = std::mem::transmute::<DocketHeader, [u8; TREE_METADATA_SIZE + 81]>; |
|
42 | let _ = std::mem::transmute::<DocketHeader, [u8; TREE_METADATA_SIZE + 81]>; | |
43 | let _ = std::mem::transmute::<Node, [u8; NODE_SIZE]>; |
|
43 | let _ = std::mem::transmute::<Node, [u8; NODE_SIZE]>; | |
44 | } |
|
44 | } | |
45 |
|
45 | |||
46 | // Must match `HEADER` in `mercurial/dirstateutils/docket.py` |
|
46 | // Must match `HEADER` in `mercurial/dirstateutils/docket.py` | |
47 | #[derive(BytesCast)] |
|
47 | #[derive(BytesCast)] | |
48 | #[repr(C)] |
|
48 | #[repr(C)] | |
49 | struct DocketHeader { |
|
49 | struct DocketHeader { | |
50 | marker: [u8; V2_FORMAT_MARKER.len()], |
|
50 | marker: [u8; V2_FORMAT_MARKER.len()], | |
51 | parent_1: [u8; STORED_NODE_ID_BYTES], |
|
51 | parent_1: [u8; STORED_NODE_ID_BYTES], | |
52 | parent_2: [u8; STORED_NODE_ID_BYTES], |
|
52 | parent_2: [u8; STORED_NODE_ID_BYTES], | |
53 |
|
53 | |||
54 | metadata: TreeMetadata, |
|
54 | metadata: TreeMetadata, | |
55 |
|
55 | |||
56 | /// Counted in bytes |
|
56 | /// Counted in bytes | |
57 | data_size: Size, |
|
57 | data_size: Size, | |
58 |
|
58 | |||
59 | uuid_size: u8, |
|
59 | uuid_size: u8, | |
60 | } |
|
60 | } | |
61 |
|
61 | |||
62 | pub struct Docket<'on_disk> { |
|
62 | pub struct Docket<'on_disk> { | |
63 | header: &'on_disk DocketHeader, |
|
63 | header: &'on_disk DocketHeader, | |
64 | uuid: &'on_disk [u8], |
|
64 | uuid: &'on_disk [u8], | |
65 | } |
|
65 | } | |
66 |
|
66 | |||
67 | /// Fields are documented in the *Tree metadata in the docket file* |
|
67 | /// Fields are documented in the *Tree metadata in the docket file* | |
68 | /// section of `mercurial/helptext/internals/dirstate-v2.txt` |
|
68 | /// section of `mercurial/helptext/internals/dirstate-v2.txt` | |
69 | #[derive(BytesCast)] |
|
69 | #[derive(BytesCast)] | |
70 | #[repr(C)] |
|
70 | #[repr(C)] | |
71 | struct TreeMetadata { |
|
71 | struct TreeMetadata { | |
72 | root_nodes: ChildNodes, |
|
72 | root_nodes: ChildNodes, | |
73 | nodes_with_entry_count: Size, |
|
73 | nodes_with_entry_count: Size, | |
74 | nodes_with_copy_source_count: Size, |
|
74 | nodes_with_copy_source_count: Size, | |
75 | unreachable_bytes: Size, |
|
75 | unreachable_bytes: Size, | |
76 | unused: [u8; 4], |
|
76 | unused: [u8; 4], | |
77 |
|
77 | |||
78 | /// See *Optional hash of ignore patterns* section of |
|
78 | /// See *Optional hash of ignore patterns* section of | |
79 | /// `mercurial/helptext/internals/dirstate-v2.txt` |
|
79 | /// `mercurial/helptext/internals/dirstate-v2.txt` | |
80 | ignore_patterns_hash: IgnorePatternsHash, |
|
80 | ignore_patterns_hash: IgnorePatternsHash, | |
81 | } |
|
81 | } | |
82 |
|
82 | |||
83 | /// Fields are documented in the *The data file format* |
|
83 | /// Fields are documented in the *The data file format* | |
84 | /// section of `mercurial/helptext/internals/dirstate-v2.txt` |
|
84 | /// section of `mercurial/helptext/internals/dirstate-v2.txt` | |
85 | #[derive(BytesCast)] |
|
85 | #[derive(BytesCast)] | |
86 | #[repr(C)] |
|
86 | #[repr(C)] | |
87 | pub(super) struct Node { |
|
87 | pub(super) struct Node { | |
88 | full_path: PathSlice, |
|
88 | full_path: PathSlice, | |
89 |
|
89 | |||
90 | /// In bytes from `self.full_path.start` |
|
90 | /// In bytes from `self.full_path.start` | |
91 | base_name_start: PathSize, |
|
91 | base_name_start: PathSize, | |
92 |
|
92 | |||
93 | copy_source: OptPathSlice, |
|
93 | copy_source: OptPathSlice, | |
94 | children: ChildNodes, |
|
94 | children: ChildNodes, | |
95 | pub(super) descendants_with_entry_count: Size, |
|
95 | pub(super) descendants_with_entry_count: Size, | |
96 | pub(super) tracked_descendants_count: Size, |
|
96 | pub(super) tracked_descendants_count: Size, | |
97 | flags: U16Be, |
|
97 | flags: U16Be, | |
98 | size: U32Be, |
|
98 | size: U32Be, | |
99 | mtime: PackedTruncatedTimestamp, |
|
99 | mtime: PackedTruncatedTimestamp, | |
100 | } |
|
100 | } | |
101 |
|
101 | |||
102 | bitflags! { |
|
102 | bitflags! { | |
103 | #[repr(C)] |
|
103 | #[repr(C)] | |
104 | struct Flags: u16 { |
|
104 | struct Flags: u16 { | |
105 | const WDIR_TRACKED = 1 << 0; |
|
105 | const WDIR_TRACKED = 1 << 0; | |
106 | const P1_TRACKED = 1 << 1; |
|
106 | const P1_TRACKED = 1 << 1; | |
107 | const P2_INFO = 1 << 2; |
|
107 | const P2_INFO = 1 << 2; | |
108 | const HAS_MODE_AND_SIZE = 1 << 3; |
|
108 | const HAS_MODE_AND_SIZE = 1 << 3; | |
109 | const HAS_FILE_MTIME = 1 << 4; |
|
109 | const HAS_FILE_MTIME = 1 << 4; | |
110 | const HAS_DIRECTORY_MTIME = 1 << 5; |
|
110 | const HAS_DIRECTORY_MTIME = 1 << 5; | |
111 | const MODE_EXEC_PERM = 1 << 6; |
|
111 | const MODE_EXEC_PERM = 1 << 6; | |
112 | const MODE_IS_SYMLINK = 1 << 7; |
|
112 | const MODE_IS_SYMLINK = 1 << 7; | |
113 | const EXPECTED_STATE_IS_MODIFIED = 1 << 8; |
|
113 | const EXPECTED_STATE_IS_MODIFIED = 1 << 8; | |
114 | const ALL_UNKNOWN_RECORDED = 1 << 9; |
|
114 | const ALL_UNKNOWN_RECORDED = 1 << 9; | |
115 | const ALL_IGNORED_RECORDED = 1 << 10; |
|
115 | const ALL_IGNORED_RECORDED = 1 << 10; | |
|
116 | const HAS_FALLBACK_EXEC = 1 << 11; | |||
|
117 | const FALLBACK_EXEC = 1 << 12; | |||
|
118 | const HAS_FALLBACK_SYMLINK = 1 << 13; | |||
|
119 | const FALLBACK_SYMLINK = 1 << 14; | |||
116 | } |
|
120 | } | |
117 | } |
|
121 | } | |
118 |
|
122 | |||
119 | /// Duration since the Unix epoch |
|
123 | /// Duration since the Unix epoch | |
120 | #[derive(BytesCast, Copy, Clone)] |
|
124 | #[derive(BytesCast, Copy, Clone)] | |
121 | #[repr(C)] |
|
125 | #[repr(C)] | |
122 | struct PackedTruncatedTimestamp { |
|
126 | struct PackedTruncatedTimestamp { | |
123 | truncated_seconds: U32Be, |
|
127 | truncated_seconds: U32Be, | |
124 | nanoseconds: U32Be, |
|
128 | nanoseconds: U32Be, | |
125 | } |
|
129 | } | |
126 |
|
130 | |||
127 | /// Counted in bytes from the start of the file |
|
131 | /// Counted in bytes from the start of the file | |
128 | /// |
|
132 | /// | |
129 | /// NOTE: not supporting `.hg/dirstate` files larger than 4 GiB. |
|
133 | /// NOTE: not supporting `.hg/dirstate` files larger than 4 GiB. | |
130 | type Offset = U32Be; |
|
134 | type Offset = U32Be; | |
131 |
|
135 | |||
132 | /// Counted in number of items |
|
136 | /// Counted in number of items | |
133 | /// |
|
137 | /// | |
134 | /// NOTE: we choose not to support counting more than 4 billion nodes anywhere. |
|
138 | /// NOTE: we choose not to support counting more than 4 billion nodes anywhere. | |
135 | type Size = U32Be; |
|
139 | type Size = U32Be; | |
136 |
|
140 | |||
137 | /// Counted in bytes |
|
141 | /// Counted in bytes | |
138 | /// |
|
142 | /// | |
139 | /// NOTE: we choose not to support file names/paths longer than 64 KiB. |
|
143 | /// NOTE: we choose not to support file names/paths longer than 64 KiB. | |
140 | type PathSize = U16Be; |
|
144 | type PathSize = U16Be; | |
141 |
|
145 | |||
142 | /// A contiguous sequence of `len` times `Node`, representing the child nodes |
|
146 | /// A contiguous sequence of `len` times `Node`, representing the child nodes | |
143 | /// of either some other node or of the repository root. |
|
147 | /// of either some other node or of the repository root. | |
144 | /// |
|
148 | /// | |
145 | /// Always sorted by ascending `full_path`, to allow binary search. |
|
149 | /// Always sorted by ascending `full_path`, to allow binary search. | |
146 | /// Since nodes with the same parent nodes also have the same parent path, |
|
150 | /// Since nodes with the same parent nodes also have the same parent path, | |
147 | /// only the `base_name`s need to be compared during binary search. |
|
151 | /// only the `base_name`s need to be compared during binary search. | |
148 | #[derive(BytesCast, Copy, Clone)] |
|
152 | #[derive(BytesCast, Copy, Clone)] | |
149 | #[repr(C)] |
|
153 | #[repr(C)] | |
150 | struct ChildNodes { |
|
154 | struct ChildNodes { | |
151 | start: Offset, |
|
155 | start: Offset, | |
152 | len: Size, |
|
156 | len: Size, | |
153 | } |
|
157 | } | |
154 |
|
158 | |||
155 | /// A `HgPath` of `len` bytes |
|
159 | /// A `HgPath` of `len` bytes | |
156 | #[derive(BytesCast, Copy, Clone)] |
|
160 | #[derive(BytesCast, Copy, Clone)] | |
157 | #[repr(C)] |
|
161 | #[repr(C)] | |
158 | struct PathSlice { |
|
162 | struct PathSlice { | |
159 | start: Offset, |
|
163 | start: Offset, | |
160 | len: PathSize, |
|
164 | len: PathSize, | |
161 | } |
|
165 | } | |
162 |
|
166 | |||
163 | /// Either nothing if `start == 0`, or a `HgPath` of `len` bytes |
|
167 | /// Either nothing if `start == 0`, or a `HgPath` of `len` bytes | |
164 | type OptPathSlice = PathSlice; |
|
168 | type OptPathSlice = PathSlice; | |
165 |
|
169 | |||
166 | /// Unexpected file format found in `.hg/dirstate` with the "v2" format. |
|
170 | /// Unexpected file format found in `.hg/dirstate` with the "v2" format. | |
167 | /// |
|
171 | /// | |
168 | /// This should only happen if Mercurial is buggy or a repository is corrupted. |
|
172 | /// This should only happen if Mercurial is buggy or a repository is corrupted. | |
169 | #[derive(Debug)] |
|
173 | #[derive(Debug)] | |
170 | pub struct DirstateV2ParseError; |
|
174 | pub struct DirstateV2ParseError; | |
171 |
|
175 | |||
172 | impl From<DirstateV2ParseError> for HgError { |
|
176 | impl From<DirstateV2ParseError> for HgError { | |
173 | fn from(_: DirstateV2ParseError) -> Self { |
|
177 | fn from(_: DirstateV2ParseError) -> Self { | |
174 | HgError::corrupted("dirstate-v2 parse error") |
|
178 | HgError::corrupted("dirstate-v2 parse error") | |
175 | } |
|
179 | } | |
176 | } |
|
180 | } | |
177 |
|
181 | |||
178 | impl From<DirstateV2ParseError> for crate::DirstateError { |
|
182 | impl From<DirstateV2ParseError> for crate::DirstateError { | |
179 | fn from(error: DirstateV2ParseError) -> Self { |
|
183 | fn from(error: DirstateV2ParseError) -> Self { | |
180 | HgError::from(error).into() |
|
184 | HgError::from(error).into() | |
181 | } |
|
185 | } | |
182 | } |
|
186 | } | |
183 |
|
187 | |||
184 | impl<'on_disk> Docket<'on_disk> { |
|
188 | impl<'on_disk> Docket<'on_disk> { | |
185 | pub fn parents(&self) -> DirstateParents { |
|
189 | pub fn parents(&self) -> DirstateParents { | |
186 | use crate::Node; |
|
190 | use crate::Node; | |
187 | let p1 = Node::try_from(&self.header.parent_1[..USED_NODE_ID_BYTES]) |
|
191 | let p1 = Node::try_from(&self.header.parent_1[..USED_NODE_ID_BYTES]) | |
188 | .unwrap() |
|
192 | .unwrap() | |
189 | .clone(); |
|
193 | .clone(); | |
190 | let p2 = Node::try_from(&self.header.parent_2[..USED_NODE_ID_BYTES]) |
|
194 | let p2 = Node::try_from(&self.header.parent_2[..USED_NODE_ID_BYTES]) | |
191 | .unwrap() |
|
195 | .unwrap() | |
192 | .clone(); |
|
196 | .clone(); | |
193 | DirstateParents { p1, p2 } |
|
197 | DirstateParents { p1, p2 } | |
194 | } |
|
198 | } | |
195 |
|
199 | |||
196 | pub fn tree_metadata(&self) -> &[u8] { |
|
200 | pub fn tree_metadata(&self) -> &[u8] { | |
197 | self.header.metadata.as_bytes() |
|
201 | self.header.metadata.as_bytes() | |
198 | } |
|
202 | } | |
199 |
|
203 | |||
200 | pub fn data_size(&self) -> usize { |
|
204 | pub fn data_size(&self) -> usize { | |
201 | // This `unwrap` could only panic on a 16-bit CPU |
|
205 | // This `unwrap` could only panic on a 16-bit CPU | |
202 | self.header.data_size.get().try_into().unwrap() |
|
206 | self.header.data_size.get().try_into().unwrap() | |
203 | } |
|
207 | } | |
204 |
|
208 | |||
205 | pub fn data_filename(&self) -> String { |
|
209 | pub fn data_filename(&self) -> String { | |
206 | String::from_utf8(format_bytes!(b"dirstate.{}", self.uuid)).unwrap() |
|
210 | String::from_utf8(format_bytes!(b"dirstate.{}", self.uuid)).unwrap() | |
207 | } |
|
211 | } | |
208 | } |
|
212 | } | |
209 |
|
213 | |||
210 | pub fn read_docket( |
|
214 | pub fn read_docket( | |
211 | on_disk: &[u8], |
|
215 | on_disk: &[u8], | |
212 | ) -> Result<Docket<'_>, DirstateV2ParseError> { |
|
216 | ) -> Result<Docket<'_>, DirstateV2ParseError> { | |
213 | let (header, uuid) = |
|
217 | let (header, uuid) = | |
214 | DocketHeader::from_bytes(on_disk).map_err(|_| DirstateV2ParseError)?; |
|
218 | DocketHeader::from_bytes(on_disk).map_err(|_| DirstateV2ParseError)?; | |
215 | let uuid_size = header.uuid_size as usize; |
|
219 | let uuid_size = header.uuid_size as usize; | |
216 | if header.marker == *V2_FORMAT_MARKER && uuid.len() == uuid_size { |
|
220 | if header.marker == *V2_FORMAT_MARKER && uuid.len() == uuid_size { | |
217 | Ok(Docket { header, uuid }) |
|
221 | Ok(Docket { header, uuid }) | |
218 | } else { |
|
222 | } else { | |
219 | Err(DirstateV2ParseError) |
|
223 | Err(DirstateV2ParseError) | |
220 | } |
|
224 | } | |
221 | } |
|
225 | } | |
222 |
|
226 | |||
223 | pub(super) fn read<'on_disk>( |
|
227 | pub(super) fn read<'on_disk>( | |
224 | on_disk: &'on_disk [u8], |
|
228 | on_disk: &'on_disk [u8], | |
225 | metadata: &[u8], |
|
229 | metadata: &[u8], | |
226 | ) -> Result<DirstateMap<'on_disk>, DirstateV2ParseError> { |
|
230 | ) -> Result<DirstateMap<'on_disk>, DirstateV2ParseError> { | |
227 | if on_disk.is_empty() { |
|
231 | if on_disk.is_empty() { | |
228 | return Ok(DirstateMap::empty(on_disk)); |
|
232 | return Ok(DirstateMap::empty(on_disk)); | |
229 | } |
|
233 | } | |
230 | let (meta, _) = TreeMetadata::from_bytes(metadata) |
|
234 | let (meta, _) = TreeMetadata::from_bytes(metadata) | |
231 | .map_err(|_| DirstateV2ParseError)?; |
|
235 | .map_err(|_| DirstateV2ParseError)?; | |
232 | let dirstate_map = DirstateMap { |
|
236 | let dirstate_map = DirstateMap { | |
233 | on_disk, |
|
237 | on_disk, | |
234 | root: dirstate_map::ChildNodes::OnDisk(read_nodes( |
|
238 | root: dirstate_map::ChildNodes::OnDisk(read_nodes( | |
235 | on_disk, |
|
239 | on_disk, | |
236 | meta.root_nodes, |
|
240 | meta.root_nodes, | |
237 | )?), |
|
241 | )?), | |
238 | nodes_with_entry_count: meta.nodes_with_entry_count.get(), |
|
242 | nodes_with_entry_count: meta.nodes_with_entry_count.get(), | |
239 | nodes_with_copy_source_count: meta.nodes_with_copy_source_count.get(), |
|
243 | nodes_with_copy_source_count: meta.nodes_with_copy_source_count.get(), | |
240 | ignore_patterns_hash: meta.ignore_patterns_hash, |
|
244 | ignore_patterns_hash: meta.ignore_patterns_hash, | |
241 | unreachable_bytes: meta.unreachable_bytes.get(), |
|
245 | unreachable_bytes: meta.unreachable_bytes.get(), | |
242 | }; |
|
246 | }; | |
243 | Ok(dirstate_map) |
|
247 | Ok(dirstate_map) | |
244 | } |
|
248 | } | |
245 |
|
249 | |||
246 | impl Node { |
|
250 | impl Node { | |
247 | pub(super) fn full_path<'on_disk>( |
|
251 | pub(super) fn full_path<'on_disk>( | |
248 | &self, |
|
252 | &self, | |
249 | on_disk: &'on_disk [u8], |
|
253 | on_disk: &'on_disk [u8], | |
250 | ) -> Result<&'on_disk HgPath, DirstateV2ParseError> { |
|
254 | ) -> Result<&'on_disk HgPath, DirstateV2ParseError> { | |
251 | read_hg_path(on_disk, self.full_path) |
|
255 | read_hg_path(on_disk, self.full_path) | |
252 | } |
|
256 | } | |
253 |
|
257 | |||
254 | pub(super) fn base_name_start<'on_disk>( |
|
258 | pub(super) fn base_name_start<'on_disk>( | |
255 | &self, |
|
259 | &self, | |
256 | ) -> Result<usize, DirstateV2ParseError> { |
|
260 | ) -> Result<usize, DirstateV2ParseError> { | |
257 | let start = self.base_name_start.get(); |
|
261 | let start = self.base_name_start.get(); | |
258 | if start < self.full_path.len.get() { |
|
262 | if start < self.full_path.len.get() { | |
259 | let start = usize::try_from(start) |
|
263 | let start = usize::try_from(start) | |
260 | // u32 -> usize, could only panic on a 16-bit CPU |
|
264 | // u32 -> usize, could only panic on a 16-bit CPU | |
261 | .expect("dirstate-v2 base_name_start out of bounds"); |
|
265 | .expect("dirstate-v2 base_name_start out of bounds"); | |
262 | Ok(start) |
|
266 | Ok(start) | |
263 | } else { |
|
267 | } else { | |
264 | Err(DirstateV2ParseError) |
|
268 | Err(DirstateV2ParseError) | |
265 | } |
|
269 | } | |
266 | } |
|
270 | } | |
267 |
|
271 | |||
268 | pub(super) fn base_name<'on_disk>( |
|
272 | pub(super) fn base_name<'on_disk>( | |
269 | &self, |
|
273 | &self, | |
270 | on_disk: &'on_disk [u8], |
|
274 | on_disk: &'on_disk [u8], | |
271 | ) -> Result<&'on_disk HgPath, DirstateV2ParseError> { |
|
275 | ) -> Result<&'on_disk HgPath, DirstateV2ParseError> { | |
272 | let full_path = self.full_path(on_disk)?; |
|
276 | let full_path = self.full_path(on_disk)?; | |
273 | let base_name_start = self.base_name_start()?; |
|
277 | let base_name_start = self.base_name_start()?; | |
274 | Ok(HgPath::new(&full_path.as_bytes()[base_name_start..])) |
|
278 | Ok(HgPath::new(&full_path.as_bytes()[base_name_start..])) | |
275 | } |
|
279 | } | |
276 |
|
280 | |||
277 | pub(super) fn path<'on_disk>( |
|
281 | pub(super) fn path<'on_disk>( | |
278 | &self, |
|
282 | &self, | |
279 | on_disk: &'on_disk [u8], |
|
283 | on_disk: &'on_disk [u8], | |
280 | ) -> Result<dirstate_map::NodeKey<'on_disk>, DirstateV2ParseError> { |
|
284 | ) -> Result<dirstate_map::NodeKey<'on_disk>, DirstateV2ParseError> { | |
281 | Ok(WithBasename::from_raw_parts( |
|
285 | Ok(WithBasename::from_raw_parts( | |
282 | Cow::Borrowed(self.full_path(on_disk)?), |
|
286 | Cow::Borrowed(self.full_path(on_disk)?), | |
283 | self.base_name_start()?, |
|
287 | self.base_name_start()?, | |
284 | )) |
|
288 | )) | |
285 | } |
|
289 | } | |
286 |
|
290 | |||
287 | pub(super) fn has_copy_source<'on_disk>(&self) -> bool { |
|
291 | pub(super) fn has_copy_source<'on_disk>(&self) -> bool { | |
288 | self.copy_source.start.get() != 0 |
|
292 | self.copy_source.start.get() != 0 | |
289 | } |
|
293 | } | |
290 |
|
294 | |||
291 | pub(super) fn copy_source<'on_disk>( |
|
295 | pub(super) fn copy_source<'on_disk>( | |
292 | &self, |
|
296 | &self, | |
293 | on_disk: &'on_disk [u8], |
|
297 | on_disk: &'on_disk [u8], | |
294 | ) -> Result<Option<&'on_disk HgPath>, DirstateV2ParseError> { |
|
298 | ) -> Result<Option<&'on_disk HgPath>, DirstateV2ParseError> { | |
295 | Ok(if self.has_copy_source() { |
|
299 | Ok(if self.has_copy_source() { | |
296 | Some(read_hg_path(on_disk, self.copy_source)?) |
|
300 | Some(read_hg_path(on_disk, self.copy_source)?) | |
297 | } else { |
|
301 | } else { | |
298 | None |
|
302 | None | |
299 | }) |
|
303 | }) | |
300 | } |
|
304 | } | |
301 |
|
305 | |||
302 | fn flags(&self) -> Flags { |
|
306 | fn flags(&self) -> Flags { | |
303 | Flags::from_bits_truncate(self.flags.get()) |
|
307 | Flags::from_bits_truncate(self.flags.get()) | |
304 | } |
|
308 | } | |
305 |
|
309 | |||
306 | fn has_entry(&self) -> bool { |
|
310 | fn has_entry(&self) -> bool { | |
307 | self.flags().intersects( |
|
311 | self.flags().intersects( | |
308 | Flags::WDIR_TRACKED | Flags::P1_TRACKED | Flags::P2_INFO, |
|
312 | Flags::WDIR_TRACKED | Flags::P1_TRACKED | Flags::P2_INFO, | |
309 | ) |
|
313 | ) | |
310 | } |
|
314 | } | |
311 |
|
315 | |||
312 | pub(super) fn node_data( |
|
316 | pub(super) fn node_data( | |
313 | &self, |
|
317 | &self, | |
314 | ) -> Result<dirstate_map::NodeData, DirstateV2ParseError> { |
|
318 | ) -> Result<dirstate_map::NodeData, DirstateV2ParseError> { | |
315 | if self.has_entry() { |
|
319 | if self.has_entry() { | |
316 | Ok(dirstate_map::NodeData::Entry(self.assume_entry())) |
|
320 | Ok(dirstate_map::NodeData::Entry(self.assume_entry())) | |
317 | } else if let Some(mtime) = self.cached_directory_mtime()? { |
|
321 | } else if let Some(mtime) = self.cached_directory_mtime()? { | |
318 | Ok(dirstate_map::NodeData::CachedDirectory { mtime }) |
|
322 | Ok(dirstate_map::NodeData::CachedDirectory { mtime }) | |
319 | } else { |
|
323 | } else { | |
320 | Ok(dirstate_map::NodeData::None) |
|
324 | Ok(dirstate_map::NodeData::None) | |
321 | } |
|
325 | } | |
322 | } |
|
326 | } | |
323 |
|
327 | |||
324 | pub(super) fn cached_directory_mtime( |
|
328 | pub(super) fn cached_directory_mtime( | |
325 | &self, |
|
329 | &self, | |
326 | ) -> Result<Option<TruncatedTimestamp>, DirstateV2ParseError> { |
|
330 | ) -> Result<Option<TruncatedTimestamp>, DirstateV2ParseError> { | |
327 | // For now we do not have code to handle the absence of |

331 | // For now we do not have code to handle the absence of | |
328 | // ALL_UNKNOWN_RECORDED, so we ignore the mtime if the flag is unset. |

332 | // ALL_UNKNOWN_RECORDED, so we ignore the mtime if the flag is unset. | |
329 | if self.flags().contains(Flags::HAS_DIRECTORY_MTIME) |
|
333 | if self.flags().contains(Flags::HAS_DIRECTORY_MTIME) | |
330 | && self.flags().contains(Flags::ALL_UNKNOWN_RECORDED) |
|
334 | && self.flags().contains(Flags::ALL_UNKNOWN_RECORDED) | |
331 | { |
|
335 | { | |
332 | if self.flags().contains(Flags::HAS_FILE_MTIME) { |
|
336 | if self.flags().contains(Flags::HAS_FILE_MTIME) { | |
333 | Err(DirstateV2ParseError) |
|
337 | Err(DirstateV2ParseError) | |
334 | } else { |
|
338 | } else { | |
335 | Ok(Some(self.mtime.try_into()?)) |
|
339 | Ok(Some(self.mtime.try_into()?)) | |
336 | } |
|
340 | } | |
337 | } else { |
|
341 | } else { | |
338 | Ok(None) |
|
342 | Ok(None) | |
339 | } |
|
343 | } | |
340 | } |
|
344 | } | |
341 |
|
345 | |||
342 | fn synthesize_unix_mode(&self) -> u32 { |
|
346 | fn synthesize_unix_mode(&self) -> u32 { | |
343 | let file_type = if self.flags().contains(Flags::MODE_IS_SYMLINK) { |
|
347 | let file_type = if self.flags().contains(Flags::MODE_IS_SYMLINK) { | |
344 | libc::S_IFLNK |
|
348 | libc::S_IFLNK | |
345 | } else { |
|
349 | } else { | |
346 | libc::S_IFREG |
|
350 | libc::S_IFREG | |
347 | }; |
|
351 | }; | |
348 | let permisions = if self.flags().contains(Flags::MODE_EXEC_PERM) { |
|
352 | let permisions = if self.flags().contains(Flags::MODE_EXEC_PERM) { | |
349 | 0o755 |
|
353 | 0o755 | |
350 | } else { |
|
354 | } else { | |
351 | 0o644 |
|
355 | 0o644 | |
352 | }; |
|
356 | }; | |
353 | file_type | permisions |
|
357 | file_type | permisions | |
354 | } |
|
358 | } | |
355 |
|
359 | |||
356 | fn assume_entry(&self) -> DirstateEntry { |
|
360 | fn assume_entry(&self) -> DirstateEntry { | |
357 | // TODO: convert through raw bits instead? |
|
361 | // TODO: convert through raw bits instead? | |
358 | let wdir_tracked = self.flags().contains(Flags::WDIR_TRACKED); |
|
362 | let wdir_tracked = self.flags().contains(Flags::WDIR_TRACKED); | |
359 | let p1_tracked = self.flags().contains(Flags::P1_TRACKED); |
|
363 | let p1_tracked = self.flags().contains(Flags::P1_TRACKED); | |
360 | let p2_info = self.flags().contains(Flags::P2_INFO); |
|
364 | let p2_info = self.flags().contains(Flags::P2_INFO); | |
361 | let mode_size = if self.flags().contains(Flags::HAS_MODE_AND_SIZE) |
|
365 | let mode_size = if self.flags().contains(Flags::HAS_MODE_AND_SIZE) | |
362 | && !self.flags().contains(Flags::EXPECTED_STATE_IS_MODIFIED) |
|
366 | && !self.flags().contains(Flags::EXPECTED_STATE_IS_MODIFIED) | |
363 | { |
|
367 | { | |
364 | Some((self.synthesize_unix_mode(), self.size.into())) |
|
368 | Some((self.synthesize_unix_mode(), self.size.into())) | |
365 | } else { |
|
369 | } else { | |
366 | None |
|
370 | None | |
367 | }; |
|
371 | }; | |
368 | let mtime = if self.flags().contains(Flags::HAS_FILE_MTIME) |
|
372 | let mtime = if self.flags().contains(Flags::HAS_FILE_MTIME) | |
369 | && !self.flags().contains(Flags::EXPECTED_STATE_IS_MODIFIED) |
|
373 | && !self.flags().contains(Flags::EXPECTED_STATE_IS_MODIFIED) | |
370 | { |
|
374 | { | |
371 | Some(self.mtime.truncated_seconds.into()) |
|
375 | Some(self.mtime.truncated_seconds.into()) | |
372 | } else { |
|
376 | } else { | |
373 | None |
|
377 | None | |
374 | }; |
|
378 | }; | |
375 | DirstateEntry::from_v2_data( |
|
379 | DirstateEntry::from_v2_data( | |
376 | wdir_tracked, |
|
380 | wdir_tracked, | |
377 | p1_tracked, |
|
381 | p1_tracked, | |
378 | p2_info, |
|
382 | p2_info, | |
379 | mode_size, |
|
383 | mode_size, | |
380 | mtime, |
|
384 | mtime, | |
381 | None, |
|
385 | None, | |
382 | None, |
|
386 | None, | |
383 | ) |
|
387 | ) | |
384 | } |
|
388 | } | |
385 |
|
389 | |||
386 | pub(super) fn entry( |
|
390 | pub(super) fn entry( | |
387 | &self, |
|
391 | &self, | |
388 | ) -> Result<Option<DirstateEntry>, DirstateV2ParseError> { |
|
392 | ) -> Result<Option<DirstateEntry>, DirstateV2ParseError> { | |
389 | if self.has_entry() { |
|
393 | if self.has_entry() { | |
390 | Ok(Some(self.assume_entry())) |
|
394 | Ok(Some(self.assume_entry())) | |
391 | } else { |
|
395 | } else { | |
392 | Ok(None) |
|
396 | Ok(None) | |
393 | } |
|
397 | } | |
394 | } |
|
398 | } | |
395 |
|
399 | |||
396 | pub(super) fn children<'on_disk>( |
|
400 | pub(super) fn children<'on_disk>( | |
397 | &self, |
|
401 | &self, | |
398 | on_disk: &'on_disk [u8], |
|
402 | on_disk: &'on_disk [u8], | |
399 | ) -> Result<&'on_disk [Node], DirstateV2ParseError> { |
|
403 | ) -> Result<&'on_disk [Node], DirstateV2ParseError> { | |
400 | read_nodes(on_disk, self.children) |
|
404 | read_nodes(on_disk, self.children) | |
401 | } |
|
405 | } | |
402 |
|
406 | |||
403 | pub(super) fn to_in_memory_node<'on_disk>( |
|
407 | pub(super) fn to_in_memory_node<'on_disk>( | |
404 | &self, |
|
408 | &self, | |
405 | on_disk: &'on_disk [u8], |
|
409 | on_disk: &'on_disk [u8], | |
406 | ) -> Result<dirstate_map::Node<'on_disk>, DirstateV2ParseError> { |
|
410 | ) -> Result<dirstate_map::Node<'on_disk>, DirstateV2ParseError> { | |
407 | Ok(dirstate_map::Node { |
|
411 | Ok(dirstate_map::Node { | |
408 | children: dirstate_map::ChildNodes::OnDisk( |
|
412 | children: dirstate_map::ChildNodes::OnDisk( | |
409 | self.children(on_disk)?, |
|
413 | self.children(on_disk)?, | |
410 | ), |
|
414 | ), | |
411 | copy_source: self.copy_source(on_disk)?.map(Cow::Borrowed), |
|
415 | copy_source: self.copy_source(on_disk)?.map(Cow::Borrowed), | |
412 | data: self.node_data()?, |
|
416 | data: self.node_data()?, | |
413 | descendants_with_entry_count: self |
|
417 | descendants_with_entry_count: self | |
414 | .descendants_with_entry_count |
|
418 | .descendants_with_entry_count | |
415 | .get(), |
|
419 | .get(), | |
416 | tracked_descendants_count: self.tracked_descendants_count.get(), |
|
420 | tracked_descendants_count: self.tracked_descendants_count.get(), | |
417 | }) |
|
421 | }) | |
418 | } |
|
422 | } | |
419 |
|
423 | |||
420 | fn from_dirstate_entry( |
|
424 | fn from_dirstate_entry( | |
421 | entry: &DirstateEntry, |
|
425 | entry: &DirstateEntry, | |
422 | ) -> (Flags, U32Be, PackedTruncatedTimestamp) { |
|
426 | ) -> (Flags, U32Be, PackedTruncatedTimestamp) { | |
423 | let (wdir_tracked, p1_tracked, p2_info, mode_size_opt, mtime_opt) = |
|
427 | let ( | |
424 | entry.v2_data(); |
|
428 | wdir_tracked, | |
|
429 | p1_tracked, | |||
|
430 | p2_info, | |||
|
431 | mode_size_opt, | |||
|
432 | mtime_opt, | |||
|
433 | fallback_exec, | |||
|
434 | fallback_symlink, | |||
|
435 | ) = entry.v2_data(); | |||
425 | // TODO: convert through raw flag bits instead? |

436 | // TODO: convert through raw flag bits instead? | |
426 | let mut flags = Flags::empty(); |
|
437 | let mut flags = Flags::empty(); | |
427 | flags.set(Flags::WDIR_TRACKED, wdir_tracked); |
|
438 | flags.set(Flags::WDIR_TRACKED, wdir_tracked); | |
428 | flags.set(Flags::P1_TRACKED, p1_tracked); |
|
439 | flags.set(Flags::P1_TRACKED, p1_tracked); | |
429 | flags.set(Flags::P2_INFO, p2_info); |
|
440 | flags.set(Flags::P2_INFO, p2_info); | |
430 | let size = if let Some((m, s)) = mode_size_opt { |
|
441 | let size = if let Some((m, s)) = mode_size_opt { | |
431 | let exec_perm = m & libc::S_IXUSR != 0; |
|
442 | let exec_perm = m & libc::S_IXUSR != 0; | |
432 | let is_symlink = m & libc::S_IFMT == libc::S_IFLNK; |
|
443 | let is_symlink = m & libc::S_IFMT == libc::S_IFLNK; | |
433 | flags.set(Flags::MODE_EXEC_PERM, exec_perm); |
|
444 | flags.set(Flags::MODE_EXEC_PERM, exec_perm); | |
434 | flags.set(Flags::MODE_IS_SYMLINK, is_symlink); |
|
445 | flags.set(Flags::MODE_IS_SYMLINK, is_symlink); | |
435 | flags.insert(Flags::HAS_MODE_AND_SIZE); |
|
446 | flags.insert(Flags::HAS_MODE_AND_SIZE); | |
436 | s.into() |
|
447 | s.into() | |
437 | } else { |
|
448 | } else { | |
438 | 0.into() |
|
449 | 0.into() | |
439 | }; |
|
450 | }; | |
440 | let mtime = if let Some(m) = mtime_opt { |
|
451 | let mtime = if let Some(m) = mtime_opt { | |
441 | flags.insert(Flags::HAS_FILE_MTIME); |
|
452 | flags.insert(Flags::HAS_FILE_MTIME); | |
442 | PackedTruncatedTimestamp { |
|
453 | PackedTruncatedTimestamp { | |
443 | truncated_seconds: m.into(), |
|
454 | truncated_seconds: m.into(), | |
444 | nanoseconds: 0.into(), |
|
455 | nanoseconds: 0.into(), | |
445 | } |
|
456 | } | |
446 | } else { |
|
457 | } else { | |
447 | PackedTruncatedTimestamp::null() |
|
458 | PackedTruncatedTimestamp::null() | |
448 | }; |
|
459 | }; | |
|
460 | if let Some(f_exec) = fallback_exec { | |||
|
461 | flags.insert(Flags::HAS_FALLBACK_EXEC); | |||
|
462 | if f_exec { | |||
|
463 | flags.insert(Flags::FALLBACK_EXEC); | |||
|
464 | } | |||
|
465 | } | |||
|
466 | if let Some(f_symlink) = fallback_symlink { | |||
|
467 | flags.insert(Flags::HAS_FALLBACK_SYMLINK); | |||
|
468 | if f_symlink { | |||
|
469 | flags.insert(Flags::FALLBACK_SYMLINK); | |||
|
470 | } | |||
|
471 | } | |||
449 | (flags, size, mtime) |
|
472 | (flags, size, mtime) | |
450 | } |
|
473 | } | |
451 | } |
|
474 | } | |
452 |
|
475 | |||
453 | fn read_hg_path( |
|
476 | fn read_hg_path( | |
454 | on_disk: &[u8], |
|
477 | on_disk: &[u8], | |
455 | slice: PathSlice, |
|
478 | slice: PathSlice, | |
456 | ) -> Result<&HgPath, DirstateV2ParseError> { |
|
479 | ) -> Result<&HgPath, DirstateV2ParseError> { | |
457 | read_slice(on_disk, slice.start, slice.len.get()).map(HgPath::new) |
|
480 | read_slice(on_disk, slice.start, slice.len.get()).map(HgPath::new) | |
458 | } |
|
481 | } | |
459 |
|
482 | |||
460 | fn read_nodes( |
|
483 | fn read_nodes( | |
461 | on_disk: &[u8], |
|
484 | on_disk: &[u8], | |
462 | slice: ChildNodes, |
|
485 | slice: ChildNodes, | |
463 | ) -> Result<&[Node], DirstateV2ParseError> { |
|
486 | ) -> Result<&[Node], DirstateV2ParseError> { | |
464 | read_slice(on_disk, slice.start, slice.len.get()) |
|
487 | read_slice(on_disk, slice.start, slice.len.get()) | |
465 | } |
|
488 | } | |
466 |
|
489 | |||
467 | fn read_slice<T, Len>( |
|
490 | fn read_slice<T, Len>( | |
468 | on_disk: &[u8], |
|
491 | on_disk: &[u8], | |
469 | start: Offset, |
|
492 | start: Offset, | |
470 | len: Len, |
|
493 | len: Len, | |
471 | ) -> Result<&[T], DirstateV2ParseError> |
|
494 | ) -> Result<&[T], DirstateV2ParseError> | |
472 | where |
|
495 | where | |
473 | T: BytesCast, |
|
496 | T: BytesCast, | |
474 | Len: TryInto<usize>, |
|
497 | Len: TryInto<usize>, | |
475 | { |
|
498 | { | |
476 | // Either `usize::MAX` would result in "out of bounds" error since a single |
|
499 | // Either `usize::MAX` would result in "out of bounds" error since a single | |
477 | // `&[u8]` cannot occupy the entire address space. |

500 | // `&[u8]` cannot occupy the entire address space. | |
478 | let start = start.get().try_into().unwrap_or(std::usize::MAX); |
|
501 | let start = start.get().try_into().unwrap_or(std::usize::MAX); | |
479 | let len = len.try_into().unwrap_or(std::usize::MAX); |
|
502 | let len = len.try_into().unwrap_or(std::usize::MAX); | |
480 | on_disk |
|
503 | on_disk | |
481 | .get(start..) |
|
504 | .get(start..) | |
482 | .and_then(|bytes| T::slice_from_bytes(bytes, len).ok()) |
|
505 | .and_then(|bytes| T::slice_from_bytes(bytes, len).ok()) | |
483 | .map(|(slice, _rest)| slice) |
|
506 | .map(|(slice, _rest)| slice) | |
484 | .ok_or_else(|| DirstateV2ParseError) |
|
507 | .ok_or_else(|| DirstateV2ParseError) | |
485 | } |
|
508 | } | |
486 |
|
509 | |||
487 | pub(crate) fn for_each_tracked_path<'on_disk>( |
|
510 | pub(crate) fn for_each_tracked_path<'on_disk>( | |
488 | on_disk: &'on_disk [u8], |
|
511 | on_disk: &'on_disk [u8], | |
489 | metadata: &[u8], |
|
512 | metadata: &[u8], | |
490 | mut f: impl FnMut(&'on_disk HgPath), |
|
513 | mut f: impl FnMut(&'on_disk HgPath), | |
491 | ) -> Result<(), DirstateV2ParseError> { |
|
514 | ) -> Result<(), DirstateV2ParseError> { | |
492 | let (meta, _) = TreeMetadata::from_bytes(metadata) |
|
515 | let (meta, _) = TreeMetadata::from_bytes(metadata) | |
493 | .map_err(|_| DirstateV2ParseError)?; |
|
516 | .map_err(|_| DirstateV2ParseError)?; | |
494 | fn recur<'on_disk>( |
|
517 | fn recur<'on_disk>( | |
495 | on_disk: &'on_disk [u8], |
|
518 | on_disk: &'on_disk [u8], | |
496 | nodes: ChildNodes, |
|
519 | nodes: ChildNodes, | |
497 | f: &mut impl FnMut(&'on_disk HgPath), |
|
520 | f: &mut impl FnMut(&'on_disk HgPath), | |
498 | ) -> Result<(), DirstateV2ParseError> { |
|
521 | ) -> Result<(), DirstateV2ParseError> { | |
499 | for node in read_nodes(on_disk, nodes)? { |
|
522 | for node in read_nodes(on_disk, nodes)? { | |
500 | if let Some(entry) = node.entry()? { |
|
523 | if let Some(entry) = node.entry()? { | |
501 | if entry.state().is_tracked() { |
|
524 | if entry.state().is_tracked() { | |
502 | f(node.full_path(on_disk)?) |
|
525 | f(node.full_path(on_disk)?) | |
503 | } |
|
526 | } | |
504 | } |
|
527 | } | |
505 | recur(on_disk, node.children, f)? |
|
528 | recur(on_disk, node.children, f)? | |
506 | } |
|
529 | } | |
507 | Ok(()) |
|
530 | Ok(()) | |
508 | } |
|
531 | } | |
509 | recur(on_disk, meta.root_nodes, &mut f) |
|
532 | recur(on_disk, meta.root_nodes, &mut f) | |
510 | } |
|
533 | } | |
511 |
|
534 | |||
512 | /// Returns new data and metadata, together with whether that data should be |
|
535 | /// Returns new data and metadata, together with whether that data should be | |
513 | /// appended to the existing data file whose content is at |
|
536 | /// appended to the existing data file whose content is at | |
514 | /// `dirstate_map.on_disk` (true), instead of written to a new data file |
|
537 | /// `dirstate_map.on_disk` (true), instead of written to a new data file | |
515 | /// (false). |
|
538 | /// (false). | |
516 | pub(super) fn write( |
|
539 | pub(super) fn write( | |
517 | dirstate_map: &mut DirstateMap, |
|
540 | dirstate_map: &mut DirstateMap, | |
518 | can_append: bool, |
|
541 | can_append: bool, | |
519 | ) -> Result<(Vec<u8>, Vec<u8>, bool), DirstateError> { |
|
542 | ) -> Result<(Vec<u8>, Vec<u8>, bool), DirstateError> { | |
520 | let append = can_append && dirstate_map.write_should_append(); |
|
543 | let append = can_append && dirstate_map.write_should_append(); | |
521 |
|
544 | |||
522 | // This ignores the space for paths, and for nodes without an entry. |
|
545 | // This ignores the space for paths, and for nodes without an entry. | |
523 | // TODO: better estimate? Skip the `Vec` and write to a file directly? |
|
546 | // TODO: better estimate? Skip the `Vec` and write to a file directly? | |
524 | let size_guess = std::mem::size_of::<Node>() |
|
547 | let size_guess = std::mem::size_of::<Node>() | |
525 | * dirstate_map.nodes_with_entry_count as usize; |
|
548 | * dirstate_map.nodes_with_entry_count as usize; | |
526 |
|
549 | |||
527 | let mut writer = Writer { |
|
550 | let mut writer = Writer { | |
528 | dirstate_map, |
|
551 | dirstate_map, | |
529 | append, |
|
552 | append, | |
530 | out: Vec::with_capacity(size_guess), |
|
553 | out: Vec::with_capacity(size_guess), | |
531 | }; |
|
554 | }; | |
532 |
|
555 | |||
533 | let root_nodes = writer.write_nodes(dirstate_map.root.as_ref())?; |
|
556 | let root_nodes = writer.write_nodes(dirstate_map.root.as_ref())?; | |
534 |
|
557 | |||
535 | let meta = TreeMetadata { |
|
558 | let meta = TreeMetadata { | |
536 | root_nodes, |
|
559 | root_nodes, | |
537 | nodes_with_entry_count: dirstate_map.nodes_with_entry_count.into(), |
|
560 | nodes_with_entry_count: dirstate_map.nodes_with_entry_count.into(), | |
538 | nodes_with_copy_source_count: dirstate_map |
|
561 | nodes_with_copy_source_count: dirstate_map | |
539 | .nodes_with_copy_source_count |
|
562 | .nodes_with_copy_source_count | |
540 | .into(), |
|
563 | .into(), | |
541 | unreachable_bytes: dirstate_map.unreachable_bytes.into(), |
|
564 | unreachable_bytes: dirstate_map.unreachable_bytes.into(), | |
542 | unused: [0; 4], |
|
565 | unused: [0; 4], | |
543 | ignore_patterns_hash: dirstate_map.ignore_patterns_hash, |
|
566 | ignore_patterns_hash: dirstate_map.ignore_patterns_hash, | |
544 | }; |
|
567 | }; | |
545 | Ok((writer.out, meta.as_bytes().to_vec(), append)) |
|
568 | Ok((writer.out, meta.as_bytes().to_vec(), append)) | |
546 | } |
|
569 | } | |
547 |
|
570 | |||
548 | struct Writer<'dmap, 'on_disk> { |
|
571 | struct Writer<'dmap, 'on_disk> { | |
549 | dirstate_map: &'dmap DirstateMap<'on_disk>, |
|
572 | dirstate_map: &'dmap DirstateMap<'on_disk>, | |
550 | append: bool, |
|
573 | append: bool, | |
551 | out: Vec<u8>, |
|
574 | out: Vec<u8>, | |
552 | } |
|
575 | } | |
553 |
|
576 | |||
554 | impl Writer<'_, '_> { |
|
577 | impl Writer<'_, '_> { | |
555 | fn write_nodes( |
|
578 | fn write_nodes( | |
556 | &mut self, |
|
579 | &mut self, | |
557 | nodes: dirstate_map::ChildNodesRef, |
|
580 | nodes: dirstate_map::ChildNodesRef, | |
558 | ) -> Result<ChildNodes, DirstateError> { |
|
581 | ) -> Result<ChildNodes, DirstateError> { | |
559 | // Reuse already-written nodes if possible |
|
582 | // Reuse already-written nodes if possible | |
560 | if self.append { |
|
583 | if self.append { | |
561 | if let dirstate_map::ChildNodesRef::OnDisk(nodes_slice) = nodes { |
|
584 | if let dirstate_map::ChildNodesRef::OnDisk(nodes_slice) = nodes { | |
562 | let start = self.on_disk_offset_of(nodes_slice).expect( |
|
585 | let start = self.on_disk_offset_of(nodes_slice).expect( | |
563 | "dirstate-v2 OnDisk nodes not found within on_disk", |
|
586 | "dirstate-v2 OnDisk nodes not found within on_disk", | |
564 | ); |
|
587 | ); | |
565 | let len = child_nodes_len_from_usize(nodes_slice.len()); |
|
588 | let len = child_nodes_len_from_usize(nodes_slice.len()); | |
566 | return Ok(ChildNodes { start, len }); |
|
589 | return Ok(ChildNodes { start, len }); | |
567 | } |
|
590 | } | |
568 | } |
|
591 | } | |
569 |
|
592 | |||
570 | // `dirstate_map::ChildNodes::InMemory` contains a `HashMap` which has |
|
593 | // `dirstate_map::ChildNodes::InMemory` contains a `HashMap` which has | |
571 | // undefined iteration order. Sort to enable binary search in the |
|
594 | // undefined iteration order. Sort to enable binary search in the | |
572 | // written file. |
|
595 | // written file. | |
573 | let nodes = nodes.sorted(); |
|
596 | let nodes = nodes.sorted(); | |
574 | let nodes_len = nodes.len(); |
|
597 | let nodes_len = nodes.len(); | |
575 |
|
598 | |||
576 | // First accumulate serialized nodes in a `Vec` |
|
599 | // First accumulate serialized nodes in a `Vec` | |
577 | let mut on_disk_nodes = Vec::with_capacity(nodes_len); |
|
600 | let mut on_disk_nodes = Vec::with_capacity(nodes_len); | |
578 | for node in nodes { |
|
601 | for node in nodes { | |
579 | let children = |
|
602 | let children = | |
580 | self.write_nodes(node.children(self.dirstate_map.on_disk)?)?; |
|
603 | self.write_nodes(node.children(self.dirstate_map.on_disk)?)?; | |
581 | let full_path = node.full_path(self.dirstate_map.on_disk)?; |
|
604 | let full_path = node.full_path(self.dirstate_map.on_disk)?; | |
582 | let full_path = self.write_path(full_path.as_bytes()); |
|
605 | let full_path = self.write_path(full_path.as_bytes()); | |
583 | let copy_source = if let Some(source) = |
|
606 | let copy_source = if let Some(source) = | |
584 | node.copy_source(self.dirstate_map.on_disk)? |
|
607 | node.copy_source(self.dirstate_map.on_disk)? | |
585 | { |
|
608 | { | |
586 | self.write_path(source.as_bytes()) |
|
609 | self.write_path(source.as_bytes()) | |
587 | } else { |
|
610 | } else { | |
588 | PathSlice { |
|
611 | PathSlice { | |
589 | start: 0.into(), |
|
612 | start: 0.into(), | |
590 | len: 0.into(), |
|
613 | len: 0.into(), | |
591 | } |
|
614 | } | |
592 | }; |
|
615 | }; | |
593 | on_disk_nodes.push(match node { |
|
616 | on_disk_nodes.push(match node { | |
594 | NodeRef::InMemory(path, node) => { |
|
617 | NodeRef::InMemory(path, node) => { | |
595 | let (flags, size, mtime) = match &node.data { |
|
618 | let (flags, size, mtime) = match &node.data { | |
596 | dirstate_map::NodeData::Entry(entry) => { |
|
619 | dirstate_map::NodeData::Entry(entry) => { | |
597 | Node::from_dirstate_entry(entry) |
|
620 | Node::from_dirstate_entry(entry) | |
598 | } |
|
621 | } | |
599 | dirstate_map::NodeData::CachedDirectory { mtime } => ( |
|
622 | dirstate_map::NodeData::CachedDirectory { mtime } => ( | |
600 | // we currently never set a mtime if unknown file |
|
623 | // we currently never set a mtime if unknown file | |
601 | // are present. |
|
624 | // are present. | |
602 | // So if we have a mtime for a directory, we know |
|
625 | // So if we have a mtime for a directory, we know | |
603 | // they are no unknown |
|
626 | // they are no unknown | |
604 | // files and we |
|
627 | // files and we | |
605 | // blindly set ALL_UNKNOWN_RECORDED. |
|
628 | // blindly set ALL_UNKNOWN_RECORDED. | |
606 | // |
|
629 | // | |
607 | // We never set ALL_IGNORED_RECORDED since we |
|
630 | // We never set ALL_IGNORED_RECORDED since we | |
608 | // don't track that case |
|
631 | // don't track that case | |
609 | // currently. |
|
632 | // currently. | |
610 | Flags::HAS_DIRECTORY_MTIME |
|
633 | Flags::HAS_DIRECTORY_MTIME | |
611 | | Flags::ALL_UNKNOWN_RECORDED, |
|
634 | | Flags::ALL_UNKNOWN_RECORDED, | |
612 | 0.into(), |
|
635 | 0.into(), | |
613 | (*mtime).into(), |
|
636 | (*mtime).into(), | |
614 | ), |
|
637 | ), | |
615 | dirstate_map::NodeData::None => ( |
|
638 | dirstate_map::NodeData::None => ( | |
616 | Flags::empty(), |
|
639 | Flags::empty(), | |
617 | 0.into(), |
|
640 | 0.into(), | |
618 | PackedTruncatedTimestamp::null(), |
|
641 | PackedTruncatedTimestamp::null(), | |
619 | ), |
|
642 | ), | |
620 | }; |
|
643 | }; | |
621 | Node { |
|
644 | Node { | |
622 | children, |
|
645 | children, | |
623 | copy_source, |
|
646 | copy_source, | |
624 | full_path, |
|
647 | full_path, | |
625 | base_name_start: u16::try_from(path.base_name_start()) |
|
648 | base_name_start: u16::try_from(path.base_name_start()) | |
626 | // Could only panic for paths over 64 KiB |
|
649 | // Could only panic for paths over 64 KiB | |
627 | .expect("dirstate-v2 path length overflow") |
|
650 | .expect("dirstate-v2 path length overflow") | |
628 | .into(), |
|
651 | .into(), | |
629 | descendants_with_entry_count: node |
|
652 | descendants_with_entry_count: node | |
630 | .descendants_with_entry_count |
|
653 | .descendants_with_entry_count | |
631 | .into(), |
|
654 | .into(), | |
632 | tracked_descendants_count: node |
|
655 | tracked_descendants_count: node | |
633 | .tracked_descendants_count |
|
656 | .tracked_descendants_count | |
634 | .into(), |
|
657 | .into(), | |
635 | flags: flags.bits().into(), |
|
658 | flags: flags.bits().into(), | |
636 | size, |
|
659 | size, | |
637 | mtime, |
|
660 | mtime, | |
638 | } |
|
661 | } | |
639 | } |
|
662 | } | |
640 | NodeRef::OnDisk(node) => Node { |
|
663 | NodeRef::OnDisk(node) => Node { | |
641 | children, |
|
664 | children, | |
642 | copy_source, |
|
665 | copy_source, | |
643 | full_path, |
|
666 | full_path, | |
644 | ..*node |
|
667 | ..*node | |
645 | }, |
|
668 | }, | |
646 | }) |
|
669 | }) | |
647 | } |
|
670 | } | |
648 | // … so we can write them contiguously, after writing everything else |

671 | // … so we can write them contiguously, after writing everything else | |
649 | // they refer to. |
|
672 | // they refer to. | |
650 | let start = self.current_offset(); |
|
673 | let start = self.current_offset(); | |
651 | let len = child_nodes_len_from_usize(nodes_len); |
|
674 | let len = child_nodes_len_from_usize(nodes_len); | |
652 | self.out.extend(on_disk_nodes.as_bytes()); |
|
675 | self.out.extend(on_disk_nodes.as_bytes()); | |
653 | Ok(ChildNodes { start, len }) |
|
676 | Ok(ChildNodes { start, len }) | |
654 | } |
|
677 | } | |
655 |
|
678 | |||
656 | /// If the given slice of items is within `on_disk`, returns its offset |
|
679 | /// If the given slice of items is within `on_disk`, returns its offset | |
657 | /// from the start of `on_disk`. |
|
680 | /// from the start of `on_disk`. | |
658 | fn on_disk_offset_of<T>(&self, slice: &[T]) -> Option<Offset> |
|
681 | fn on_disk_offset_of<T>(&self, slice: &[T]) -> Option<Offset> | |
659 | where |
|
682 | where | |
660 | T: BytesCast, |
|
683 | T: BytesCast, | |
661 | { |
|
684 | { | |
662 | fn address_range(slice: &[u8]) -> std::ops::RangeInclusive<usize> { |
|
685 | fn address_range(slice: &[u8]) -> std::ops::RangeInclusive<usize> { | |
663 | let start = slice.as_ptr() as usize; |
|
686 | let start = slice.as_ptr() as usize; | |
664 | let end = start + slice.len(); |
|
687 | let end = start + slice.len(); | |
665 | start..=end |
|
688 | start..=end | |
666 | } |
|
689 | } | |
667 | let slice_addresses = address_range(slice.as_bytes()); |
|
690 | let slice_addresses = address_range(slice.as_bytes()); | |
668 | let on_disk_addresses = address_range(self.dirstate_map.on_disk); |
|
691 | let on_disk_addresses = address_range(self.dirstate_map.on_disk); | |
669 | if on_disk_addresses.contains(slice_addresses.start()) |
|
692 | if on_disk_addresses.contains(slice_addresses.start()) | |
670 | && on_disk_addresses.contains(slice_addresses.end()) |
|
693 | && on_disk_addresses.contains(slice_addresses.end()) | |
671 | { |
|
694 | { | |
672 | let offset = slice_addresses.start() - on_disk_addresses.start(); |
|
695 | let offset = slice_addresses.start() - on_disk_addresses.start(); | |
673 | Some(offset_from_usize(offset)) |
|
696 | Some(offset_from_usize(offset)) | |
674 | } else { |
|
697 | } else { | |
675 | None |
|
698 | None | |
676 | } |
|
699 | } | |
677 | } |
|
700 | } | |
678 |
|
701 | |||
679 | fn current_offset(&mut self) -> Offset { |
|
702 | fn current_offset(&mut self) -> Offset { | |
680 | let mut offset = self.out.len(); |
|
703 | let mut offset = self.out.len(); | |
681 | if self.append { |
|
704 | if self.append { | |
682 | offset += self.dirstate_map.on_disk.len() |
|
705 | offset += self.dirstate_map.on_disk.len() | |
683 | } |
|
706 | } | |
684 | offset_from_usize(offset) |
|
707 | offset_from_usize(offset) | |
685 | } |
|
708 | } | |
686 |
|
709 | |||
687 | fn write_path(&mut self, slice: &[u8]) -> PathSlice { |
|
710 | fn write_path(&mut self, slice: &[u8]) -> PathSlice { | |
688 | let len = path_len_from_usize(slice.len()); |
|
711 | let len = path_len_from_usize(slice.len()); | |
689 | // Reuse an already-written path if possible |
|
712 | // Reuse an already-written path if possible | |
690 | if self.append { |
|
713 | if self.append { | |
691 | if let Some(start) = self.on_disk_offset_of(slice) { |
|
714 | if let Some(start) = self.on_disk_offset_of(slice) { | |
692 | return PathSlice { start, len }; |
|
715 | return PathSlice { start, len }; | |
693 | } |
|
716 | } | |
694 | } |
|
717 | } | |
695 | let start = self.current_offset(); |
|
718 | let start = self.current_offset(); | |
696 | self.out.extend(slice.as_bytes()); |
|
719 | self.out.extend(slice.as_bytes()); | |
697 | PathSlice { start, len } |
|
720 | PathSlice { start, len } | |
698 | } |
|
721 | } | |
699 | } |
|
722 | } | |
700 |
|
723 | |||
701 | fn offset_from_usize(x: usize) -> Offset { |
|
724 | fn offset_from_usize(x: usize) -> Offset { | |
702 | u32::try_from(x) |
|
725 | u32::try_from(x) | |
703 | // Could only panic for a dirstate file larger than 4 GiB |
|
726 | // Could only panic for a dirstate file larger than 4 GiB | |
704 | .expect("dirstate-v2 offset overflow") |
|
727 | .expect("dirstate-v2 offset overflow") | |
705 | .into() |
|
728 | .into() | |
706 | } |
|
729 | } | |
707 |
|
730 | |||
708 | fn child_nodes_len_from_usize(x: usize) -> Size { |
|
731 | fn child_nodes_len_from_usize(x: usize) -> Size { | |
709 | u32::try_from(x) |
|
732 | u32::try_from(x) | |
710 | // Could only panic with over 4 billion nodes |
|
733 | // Could only panic with over 4 billion nodes | |
711 | .expect("dirstate-v2 slice length overflow") |
|
734 | .expect("dirstate-v2 slice length overflow") | |
712 | .into() |
|
735 | .into() | |
713 | } |
|
736 | } | |
714 |
|
737 | |||
715 | fn path_len_from_usize(x: usize) -> PathSize { |
|
738 | fn path_len_from_usize(x: usize) -> PathSize { | |
716 | u16::try_from(x) |
|
739 | u16::try_from(x) | |
717 | // Could only panic for paths over 64 KiB |
|
740 | // Could only panic for paths over 64 KiB | |
718 | .expect("dirstate-v2 path length overflow") |
|
741 | .expect("dirstate-v2 path length overflow") | |
719 | .into() |
|
742 | .into() | |
720 | } |
|
743 | } | |
721 |
|
744 | |||
722 | impl From<TruncatedTimestamp> for PackedTruncatedTimestamp { |
|
745 | impl From<TruncatedTimestamp> for PackedTruncatedTimestamp { | |
723 | fn from(timestamp: TruncatedTimestamp) -> Self { |
|
746 | fn from(timestamp: TruncatedTimestamp) -> Self { | |
724 | Self { |
|
747 | Self { | |
725 | truncated_seconds: timestamp.truncated_seconds().into(), |
|
748 | truncated_seconds: timestamp.truncated_seconds().into(), | |
726 | nanoseconds: timestamp.nanoseconds().into(), |
|
749 | nanoseconds: timestamp.nanoseconds().into(), | |
727 | } |
|
750 | } | |
728 | } |
|
751 | } | |
729 | } |
|
752 | } | |
730 |
|
753 | |||
731 | impl TryFrom<PackedTruncatedTimestamp> for TruncatedTimestamp { |
|
754 | impl TryFrom<PackedTruncatedTimestamp> for TruncatedTimestamp { | |
732 | type Error = DirstateV2ParseError; |
|
755 | type Error = DirstateV2ParseError; | |
733 |
|
756 | |||
734 | fn try_from( |
|
757 | fn try_from( | |
735 | timestamp: PackedTruncatedTimestamp, |
|
758 | timestamp: PackedTruncatedTimestamp, | |
736 | ) -> Result<Self, Self::Error> { |
|
759 | ) -> Result<Self, Self::Error> { | |
737 | Self::from_already_truncated( |
|
760 | Self::from_already_truncated( | |
738 | timestamp.truncated_seconds.get(), |
|
761 | timestamp.truncated_seconds.get(), | |
739 | timestamp.nanoseconds.get(), |
|
762 | timestamp.nanoseconds.get(), | |
740 | ) |
|
763 | ) | |
741 | } |
|
764 | } | |
742 | } |
|
765 | } | |
743 | impl PackedTruncatedTimestamp { |
|
766 | impl PackedTruncatedTimestamp { | |
744 | fn null() -> Self { |
|
767 | fn null() -> Self { | |
745 | Self { |
|
768 | Self { | |
746 | truncated_seconds: 0.into(), |
|
769 | truncated_seconds: 0.into(), | |
747 | nanoseconds: 0.into(), |
|
770 | nanoseconds: 0.into(), | |
748 | } |
|
771 | } | |
749 | } |
|
772 | } | |
750 | } |
|
773 | } |
General Comments 0
You need to be logged in to leave comments.
Login now