win32text.py
249 lines
| 7.5 KiB
| text/x-python
|
PythonLexer
/ hgext / win32text.py
OHASHI Hideya
|
r6481 | # win32text.py - LF <-> CRLF/CR translation utilities for Windows/Mac users | ||
Jesse Glick
|
r5675 | # | ||
Raphaël Gomès
|
r47575 | # Copyright 2005, 2007-2009 Olivia Mackall <olivia@selenic.com> and others | ||
Martin Geisler
|
r8253 | # | ||
# This software may be used and distributed according to the terms of the | ||||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Dirkjan Ochtman
|
r8873 | |||
Matt Mackall
|
r20624 | '''perform automatic newline conversion (DEPRECATED) | ||
Dirkjan Ochtman
|
r8873 | |||
Martin Geisler
|
r11269 | Deprecation: The win32text extension requires each user to configure | ||
the extension again and again for each clone since the configuration | ||||
is not copied when cloning. | ||||
We have therefore made the ``eol`` as an alternative. The ``eol`` | ||||
uses a version controlled file for its configuration and each clone | ||||
will therefore use the right settings from the start. | ||||
Martin Geisler
|
r9217 | To perform automatic newline conversion, use:: | ||
Dirkjan Ochtman
|
r8873 | |||
Martin Geisler
|
r9217 | [extensions] | ||
Martin Geisler
|
r10112 | win32text = | ||
Martin Geisler
|
r9217 | [encode] | ||
** = cleverencode: | ||||
# or ** = macencode: | ||||
Dirkjan Ochtman
|
r8873 | |||
Martin Geisler
|
r9217 | [decode] | ||
** = cleverdecode: | ||||
# or ** = macdecode: | ||||
Dirkjan Ochtman
|
r8873 | |||
Martin Geisler
|
r9217 | If not doing conversion, to make sure you do not commit CRLF/CR by accident:: | ||
Dirkjan Ochtman
|
r8873 | |||
Martin Geisler
|
r9217 | [hooks] | ||
pretxncommit.crlf = python:hgext.win32text.forbidcrlf | ||||
# or pretxncommit.cr = python:hgext.win32text.forbidcr | ||||
Dirkjan Ochtman
|
r8873 | |||
To do the same check on a server to prevent CRLF/CR from being | ||||
Martin Geisler
|
r9217 | pushed or pulled:: | ||
Dirkjan Ochtman
|
r8873 | |||
Martin Geisler
|
r9217 | [hooks] | ||
pretxnchangegroup.crlf = python:hgext.win32text.forbidcrlf | ||||
# or pretxnchangegroup.cr = python:hgext.win32text.forbidcr | ||||
Dirkjan Ochtman
|
r8873 | ''' | ||
Jesse Glick
|
r5675 | |||
Matt Harbison
|
r52756 | from __future__ import annotations | ||
Pulkit Goyal
|
r29485 | |||
import re | ||||
Martin Geisler
|
r7225 | from mercurial.i18n import _ | ||
Augie Fackler
|
r43346 | from mercurial.node import short | ||
Pulkit Goyal
|
r29485 | from mercurial import ( | ||
r49211 | cmdutil, | |||
extensions, | ||||
Boris Feld
|
r34186 | registrar, | ||
Yuya Nishihara
|
r37102 | ) | ||
Augie Fackler
|
r43346 | from mercurial.utils import stringutil | ||
Lee Cantey
|
r4859 | |||
Augie Fackler
|
r29841 | # Note for extension authors: ONLY specify testedwith = 'ships-with-hg-core' for | ||
Augie Fackler
|
r25186 | # extensions which SHIP WITH MERCURIAL. Non-mainline extensions should | ||
# be specifying the version(s) of Mercurial they are tested with, or | ||||
# leave the attribute unspecified. | ||||
Augie Fackler
|
r43347 | testedwith = b'ships-with-hg-core' | ||
Augie Fackler
|
r16743 | |||
Boris Feld
|
r34186 | configtable = {} | ||
configitem = registrar.configitem(configtable) | ||||
Augie Fackler
|
r43346 | configitem( | ||
Augie Fackler
|
r46554 | b'win32text', | ||
b'warn', | ||||
default=True, | ||||
Boris Feld
|
r34186 | ) | ||
Lee Cantey
|
r4859 | # regexp for single LF without CR preceding. | ||
Augie Fackler
|
r43347 | re_single_lf = re.compile(b'(^|[^\r])\n', re.MULTILINE) | ||
Lee Cantey
|
r4859 | |||
Augie Fackler
|
r43347 | newlinestr = {b'\r\n': b'CRLF', b'\r': b'CR'} | ||
filterstr = {b'\r\n': b'clever', b'\r': b'mac'} | ||||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def checknewline(s, newline, ui=None, repo=None, filename=None): | ||
# warn if already has 'newline' in repository. | ||||
Lee Cantey
|
r4859 | # it might cause unexpected eol conversion. | ||
# see issue 302: | ||||
Matt Mackall
|
r26420 | # https://bz.mercurial-scm.org/302 | ||
OHASHI Hideya
|
r6481 | if newline in s and ui and filename and repo: | ||
Augie Fackler
|
r43346 | ui.warn( | ||
_( | ||||
Augie Fackler
|
r43347 | b'WARNING: %s already has %s line endings\n' | ||
b'and does not need EOL conversion by the win32text plugin.\n' | ||||
b'Before your next commit, please reconsider your ' | ||||
b'encode/decode settings in \nMercurial.ini or %s.\n' | ||||
Augie Fackler
|
r43346 | ) | ||
Augie Fackler
|
r43347 | % (filename, newlinestr[newline], repo.vfs.join(b'hgrc')) | ||
Augie Fackler
|
r43346 | ) | ||
OHASHI Hideya
|
r6481 | |||
def dumbdecode(s, cmd, **kwargs): | ||||
Augie Fackler
|
r43347 | checknewline(s, b'\r\n', **kwargs) | ||
Lee Cantey
|
r4859 | # replace single LF to CRLF | ||
Augie Fackler
|
r43347 | return re_single_lf.sub(b'\\1\r\n', s) | ||
Lee Cantey
|
r4859 | |||
Augie Fackler
|
r43346 | |||
Lee Cantey
|
r4859 | def dumbencode(s, cmd): | ||
Augie Fackler
|
r43347 | return s.replace(b'\r\n', b'\n') | ||
Lee Cantey
|
r4859 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def macdumbdecode(s, cmd, **kwargs): | ||
Augie Fackler
|
r43347 | checknewline(s, b'\r', **kwargs) | ||
return s.replace(b'\n', b'\r') | ||||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def macdumbencode(s, cmd): | ||
Augie Fackler
|
r43347 | return s.replace(b'\r', b'\n') | ||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
Jesse Glick
|
r5967 | def cleverdecode(s, cmd, **kwargs): | ||
Yuya Nishihara
|
r37102 | if not stringutil.binary(s): | ||
Patrick Mezard
|
r6473 | return dumbdecode(s, cmd, **kwargs) | ||
return s | ||||
Lee Cantey
|
r4859 | |||
Augie Fackler
|
r43346 | |||
Lee Cantey
|
r4859 | def cleverencode(s, cmd): | ||
Yuya Nishihara
|
r37102 | if not stringutil.binary(s): | ||
Patrick Mezard
|
r6473 | return dumbencode(s, cmd) | ||
return s | ||||
Lee Cantey
|
r4859 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def macdecode(s, cmd, **kwargs): | ||
Yuya Nishihara
|
r37102 | if not stringutil.binary(s): | ||
Patrick Mezard
|
r6484 | return macdumbdecode(s, cmd, **kwargs) | ||
return s | ||||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def macencode(s, cmd): | ||
Yuya Nishihara
|
r37102 | if not stringutil.binary(s): | ||
Patrick Mezard
|
r6484 | return macdumbencode(s, cmd) | ||
return s | ||||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r5966 | _filters = { | ||
Augie Fackler
|
r43347 | b'dumbdecode:': dumbdecode, | ||
b'dumbencode:': dumbencode, | ||||
b'cleverdecode:': cleverdecode, | ||||
b'cleverencode:': cleverencode, | ||||
b'macdumbdecode:': macdumbdecode, | ||||
b'macdumbencode:': macdumbencode, | ||||
b'macdecode:': macdecode, | ||||
b'macencode:': macencode, | ||||
Augie Fackler
|
r43346 | } | ||
Jesse Glick
|
r5675 | |||
Patrick Mezard
|
r6483 | def forbidnewline(ui, repo, hooktype, node, newline, **kwargs): | ||
Jesse Glick
|
r5675 | halt = False | ||
Martin Geisler
|
r8150 | seen = set() | ||
Bryan O'Sullivan
|
r8147 | # we try to walk changesets in reverse order from newest to | ||
# oldest, so that if we see a file multiple times, we take the | ||||
# newest version as canonical. this prevents us from blocking a | ||||
# changegroup that contains an unacceptable commit followed later | ||||
# by a commit that fixes the problem. | ||||
Augie Fackler
|
r43347 | tip = repo[b'tip'] | ||
Manuel Jacob
|
r50179 | for rev in range(repo.changelog.tiprev(), repo[node].rev() - 1, -1): | ||
Matt Mackall
|
r6747 | c = repo[rev] | ||
Jesse Glick
|
r5675 | for f in c.files(): | ||
Bryan O'Sullivan
|
r8147 | if f in seen or f not in tip or f not in c: | ||
Jesse Glick
|
r5675 | continue | ||
Bryan O'Sullivan
|
r8147 | seen.add(f) | ||
Jesse Glick
|
r5675 | data = c[f].data() | ||
Yuya Nishihara
|
r37102 | if not stringutil.binary(data) and newline in data: | ||
Jesse Glick
|
r5675 | if not halt: | ||
Augie Fackler
|
r43346 | ui.warn( | ||
_( | ||||
Augie Fackler
|
r43347 | b'attempt to commit or push text file(s) ' | ||
b'using %s line endings\n' | ||||
Augie Fackler
|
r43346 | ) | ||
% newlinestr[newline] | ||||
) | ||||
Augie Fackler
|
r43347 | ui.warn(_(b'in %s: %s\n') % (short(c.node()), f)) | ||
Jesse Glick
|
r5675 | halt = True | ||
Augie Fackler
|
r43347 | if halt and hooktype == b'pretxnchangegroup': | ||
OHASHI Hideya
|
r6481 | crlf = newlinestr[newline].lower() | ||
filter = filterstr[newline] | ||||
Augie Fackler
|
r43346 | ui.warn( | ||
_( | ||||
Augie Fackler
|
r43347 | b'\nTo prevent this mistake in your local repository,\n' | ||
b'add to Mercurial.ini or .hg/hgrc:\n' | ||||
b'\n' | ||||
b'[hooks]\n' | ||||
b'pretxncommit.%s = python:hgext.win32text.forbid%s\n' | ||||
b'\n' | ||||
b'and also consider adding:\n' | ||||
b'\n' | ||||
b'[extensions]\n' | ||||
b'win32text =\n' | ||||
b'[encode]\n' | ||||
b'** = %sencode:\n' | ||||
b'[decode]\n' | ||||
b'** = %sdecode:\n' | ||||
Augie Fackler
|
r43346 | ) | ||
% (crlf, crlf, filter, filter) | ||||
) | ||||
Jesse Glick
|
r5675 | return halt | ||
Patrick Mezard
|
r5966 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def forbidcrlf(ui, repo, hooktype, node, **kwargs): | ||
Augie Fackler
|
r43347 | return forbidnewline(ui, repo, hooktype, node, b'\r\n', **kwargs) | ||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
OHASHI Hideya
|
r6481 | def forbidcr(ui, repo, hooktype, node, **kwargs): | ||
Augie Fackler
|
r43347 | return forbidnewline(ui, repo, hooktype, node, b'\r', **kwargs) | ||
OHASHI Hideya
|
r6481 | |||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r5966 | def reposetup(ui, repo): | ||
if not repo.local(): | ||||
return | ||||
Gregory Szorc
|
r49768 | for name, fn in _filters.items(): | ||
Patrick Mezard
|
r5966 | repo.adddatafilter(name, fn) | ||
Augie Fackler
|
r43346 | |||
r49211 | def wrap_revert(orig, repo, ctx, names, uipathfn, actions, *args, **kwargs): | |||
# reset dirstate cache for file we touch | ||||
ds = repo.dirstate | ||||
r50908 | for filename in actions[b'revert'][0]: | |||
entry = ds.get_entry(filename) | ||||
if entry is not None: | ||||
if entry.p1_tracked: | ||||
# If we revert the file, it is possibly dirty. However, | ||||
# this extension meddle with the file content and therefore | ||||
# its size. As a result, we cannot simply call | ||||
# `dirstate.set_possibly_dirty` as it will not affet the | ||||
# expected size of the file. | ||||
# | ||||
# At least, now, the quirk is properly documented. | ||||
ds.hacky_extension_update_file( | ||||
filename, | ||||
entry.tracked, | ||||
r50909 | p1_tracked=entry.p1_tracked, | |||
r50908 | p2_info=entry.p2_info, | |||
) | ||||
r49211 | return orig(repo, ctx, names, uipathfn, actions, *args, **kwargs) | |||
Steve Borho
|
r12837 | def extsetup(ui): | ||
Matt Mackall
|
r25829 | # deprecated config: win32text.warn | ||
Augie Fackler
|
r43347 | if ui.configbool(b'win32text', b'warn'): | ||
Augie Fackler
|
r43346 | ui.warn( | ||
_( | ||||
Augie Fackler
|
r43347 | b"win32text is deprecated: " | ||
b"https://mercurial-scm.org/wiki/Win32TextExtension\n" | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
r49211 | extensions.wrapfunction(cmdutil, '_performrevert', wrap_revert) | |||