##// END OF EJS Templates
eol: mention the hook in the module docstring
Martin Geisler -
r12980:20974e51 stable
parent child Browse files
Show More
@@ -1,261 +1,266
1 1 """automatically manage newlines in repository files
2 2
3 3 This extension allows you to manage the type of line endings (CRLF or
4 4 LF) that are used in the repository and in the local working
5 5 directory. That way you can get CRLF line endings on Windows and LF on
6 6 Unix/Mac, thereby letting everybody use their OS native line endings.
7 7
8 8 The extension reads its configuration from a versioned ``.hgeol``
9 9 configuration file every time you run an ``hg`` command. The
10 10 ``.hgeol`` file use the same syntax as all other Mercurial
11 11 configuration files. It uses two sections, ``[patterns]`` and
12 12 ``[repository]``.
13 13
14 14 The ``[patterns]`` section specifies the line endings used in the
15 15 working directory. The format is specified by a file pattern. The
16 16 first match is used, so put more specific patterns first. The
17 17 available line endings are ``LF``, ``CRLF``, and ``BIN``.
18 18
19 19 Files with the declared format of ``CRLF`` or ``LF`` are always
20 20 checked out in that format and files declared to be binary (``BIN``)
21 21 are left unchanged. Additionally, ``native`` is an alias for the
22 22 platform's default line ending: ``LF`` on Unix (including Mac OS X)
23 23 and ``CRLF`` on Windows. Note that ``BIN`` (do nothing to line
24 24 endings) is Mercurial's default behaviour; it is only needed if you
25 25 need to override a later, more general pattern.
26 26
27 27 The optional ``[repository]`` section specifies the line endings to
28 28 use for files stored in the repository. It has a single setting,
29 29 ``native``, which determines the storage line endings for files
30 30 declared as ``native`` in the ``[patterns]`` section. It can be set to
31 31 ``LF`` or ``CRLF``. The default is ``LF``. For example, this means
32 32 that on Windows, files configured as ``native`` (``CRLF`` by default)
33 33 will be converted to ``LF`` when stored in the repository. Files
34 34 declared as ``LF``, ``CRLF``, or ``BIN`` in the ``[patterns]`` section
35 35 are always stored as-is in the repository.
36 36
37 37 Example versioned ``.hgeol`` file::
38 38
39 39 [patterns]
40 40 **.py = native
41 41 **.vcproj = CRLF
42 42 **.txt = native
43 43 Makefile = LF
44 44 **.jpg = BIN
45 45
46 46 [repository]
47 47 native = LF
48 48
49 49 The extension uses an optional ``[eol]`` section in your hgrc file
50 50 (not the ``.hgeol`` file) for settings that control the overall
51 51 behavior. There are two settings:
52 52
53 53 - ``eol.native`` (default ``os.linesep``) can be set to ``LF`` or
54 54 ``CRLF`` to override the default interpretation of ``native`` for
55 55 checkout. This can be used with :hg:`archive` on Unix, say, to
56 56 generate an archive where files have line endings for Windows.
57 57
58 58 - ``eol.only-consistent`` (default True) can be set to False to make
59 59 the extension convert files with inconsistent EOLs. Inconsistent
60 60 means that there is both ``CRLF`` and ``LF`` present in the file.
61 61 Such files are normally not touched under the assumption that they
62 62 have mixed EOLs on purpose.
63 63
64 The ``win32text.forbid*`` hooks provided by the win32text extension
65 have been unified into a single hook named ``eol.hook``. The hook will
66 lookup the expected line endings from the ``.hgeol`` file, which means
67 you must migrate to a ``.hgeol`` file first before using the hook.
68
64 69 See :hg:`help patterns` for more information about the glob patterns
65 70 used.
66 71 """
67 72
68 73 from mercurial.i18n import _
69 74 from mercurial import util, config, extensions, match
70 75 import re, os
71 76
72 77 # Matches a lone LF, i.e., one that is not part of CRLF.
73 78 singlelf = re.compile('(^|[^\r])\n')
74 79 # Matches a single EOL which can either be a CRLF where repeated CR
75 80 # are removed or a LF. We do not care about old Machintosh files, so a
76 81 # stray CR is an error.
77 82 eolre = re.compile('\r*\n')
78 83
79 84
80 85 def inconsistenteol(data):
81 86 return '\r\n' in data and singlelf.search(data)
82 87
83 88 def tolf(s, params, ui, **kwargs):
84 89 """Filter to convert to LF EOLs."""
85 90 if util.binary(s):
86 91 return s
87 92 if ui.configbool('eol', 'only-consistent', True) and inconsistenteol(s):
88 93 return s
89 94 return eolre.sub('\n', s)
90 95
91 96 def tocrlf(s, params, ui, **kwargs):
92 97 """Filter to convert to CRLF EOLs."""
93 98 if util.binary(s):
94 99 return s
95 100 if ui.configbool('eol', 'only-consistent', True) and inconsistenteol(s):
96 101 return s
97 102 return eolre.sub('\r\n', s)
98 103
99 104 def isbinary(s, params):
100 105 """Filter to do nothing with the file."""
101 106 return s
102 107
103 108 filters = {
104 109 'to-lf': tolf,
105 110 'to-crlf': tocrlf,
106 111 'is-binary': isbinary,
107 112 }
108 113
109 114
110 115 def hook(ui, repo, node, hooktype, **kwargs):
111 116 """verify that files have expected EOLs"""
112 117 files = set()
113 118 for rev in xrange(repo[node].rev(), len(repo)):
114 119 files.update(repo[rev].files())
115 120 tip = repo['tip']
116 121 for f in files:
117 122 if f not in tip:
118 123 continue
119 124 for pattern, target in ui.configitems('encode'):
120 125 if match.match(repo.root, '', [pattern])(f):
121 126 data = tip[f].data()
122 127 if target == "to-lf" and "\r\n" in data:
123 128 raise util.Abort(_("%s should not have CRLF line endings")
124 129 % f)
125 130 elif target == "to-crlf" and singlelf.search(data):
126 131 raise util.Abort(_("%s should not have LF line endings")
127 132 % f)
128 133
129 134
130 135 def preupdate(ui, repo, hooktype, parent1, parent2):
131 136 #print "preupdate for %s: %s -> %s" % (repo.root, parent1, parent2)
132 137 repo.readhgeol(parent1)
133 138 return False
134 139
135 140 def uisetup(ui):
136 141 ui.setconfig('hooks', 'preupdate.eol', preupdate)
137 142
138 143 def extsetup(ui):
139 144 try:
140 145 extensions.find('win32text')
141 146 raise util.Abort(_("the eol extension is incompatible with the "
142 147 "win32text extension"))
143 148 except KeyError:
144 149 pass
145 150
146 151
147 152 def reposetup(ui, repo):
148 153 uisetup(repo.ui)
149 154 #print "reposetup for", repo.root
150 155
151 156 if not repo.local():
152 157 return
153 158 for name, fn in filters.iteritems():
154 159 repo.adddatafilter(name, fn)
155 160
156 161 ui.setconfig('patch', 'eol', 'auto')
157 162
158 163 class eolrepo(repo.__class__):
159 164
160 165 _decode = {'LF': 'to-lf', 'CRLF': 'to-crlf', 'BIN': 'is-binary'}
161 166 _encode = {'LF': 'to-lf', 'CRLF': 'to-crlf', 'BIN': 'is-binary'}
162 167
163 168 def readhgeol(self, node=None, data=None):
164 169 if data is None:
165 170 try:
166 171 if node is None:
167 172 data = self.wfile('.hgeol').read()
168 173 else:
169 174 data = self[node]['.hgeol'].data()
170 175 except (IOError, LookupError):
171 176 return None
172 177
173 178 if self.ui.config('eol', 'native', os.linesep) in ('LF', '\n'):
174 179 self._decode['NATIVE'] = 'to-lf'
175 180 else:
176 181 self._decode['NATIVE'] = 'to-crlf'
177 182
178 183 eol = config.config()
179 184 # Our files should not be touched. The pattern must be
180 185 # inserted first override a '** = native' pattern.
181 186 eol.set('patterns', '.hg*', 'BIN')
182 187 # We can then parse the user's patterns.
183 188 eol.parse('.hgeol', data)
184 189
185 190 if eol.get('repository', 'native') == 'CRLF':
186 191 self._encode['NATIVE'] = 'to-crlf'
187 192 else:
188 193 self._encode['NATIVE'] = 'to-lf'
189 194
190 195 for pattern, style in eol.items('patterns'):
191 196 key = style.upper()
192 197 try:
193 198 self.ui.setconfig('decode', pattern, self._decode[key])
194 199 self.ui.setconfig('encode', pattern, self._encode[key])
195 200 except KeyError:
196 201 self.ui.warn(_("ignoring unknown EOL style '%s' from %s\n")
197 202 % (style, eol.source('patterns', pattern)))
198 203
199 204 include = []
200 205 exclude = []
201 206 for pattern, style in eol.items('patterns'):
202 207 key = style.upper()
203 208 if key == 'BIN':
204 209 exclude.append(pattern)
205 210 else:
206 211 include.append(pattern)
207 212
208 213 # This will match the files for which we need to care
209 214 # about inconsistent newlines.
210 215 return match.match(self.root, '', [], include, exclude)
211 216
212 217 def _hgcleardirstate(self):
213 218 self._eolfile = self.readhgeol() or self.readhgeol('tip')
214 219
215 220 if not self._eolfile:
216 221 self._eolfile = util.never
217 222 return
218 223
219 224 try:
220 225 cachemtime = os.path.getmtime(self.join("eol.cache"))
221 226 except OSError:
222 227 cachemtime = 0
223 228
224 229 try:
225 230 eolmtime = os.path.getmtime(self.wjoin(".hgeol"))
226 231 except OSError:
227 232 eolmtime = 0
228 233
229 234 if eolmtime > cachemtime:
230 235 ui.debug("eol: detected change in .hgeol\n")
231 236 # TODO: we could introduce a method for this in dirstate.
232 237 wlock = None
233 238 try:
234 239 wlock = self.wlock()
235 240 for f, e in self.dirstate._map.iteritems():
236 241 self.dirstate._map[f] = (e[0], e[1], -1, 0)
237 242 self.dirstate._dirty = True
238 243 # Touch the cache to update mtime. TODO: are we sure this
239 244 # always enought to update the mtime, or should we write a
240 245 # bit to the file?
241 246 self.opener("eol.cache", "w").close()
242 247 finally:
243 248 if wlock is not None:
244 249 wlock.release()
245 250
246 251 def commitctx(self, ctx, error=False):
247 252 for f in sorted(ctx.added() + ctx.modified()):
248 253 if not self._eolfile(f):
249 254 continue
250 255 data = ctx[f].data()
251 256 if util.binary(data):
252 257 # We should not abort here, since the user should
253 258 # be able to say "** = native" to automatically
254 259 # have all non-binary files taken care of.
255 260 continue
256 261 if inconsistenteol(data):
257 262 raise util.Abort(_("inconsistent newline style "
258 263 "in %s\n" % f))
259 264 return super(eolrepo, self).commitctx(ctx, error)
260 265 repo.__class__ = eolrepo
261 266 repo._hgcleardirstate()
General Comments 0
You need to be logged in to leave comments. Login now