upstream/mercurial-mirror Files · mercurial/pure/charencode.py

interfaces: add a Protocol class for `scmutil.status`...

interfaces: add a Protocol class for `scmutil.status`

I initially tried moving this to the `interfaces` package, both to have more cleanly defined interfaces (interfaces shouldn't have to reach into implementation files for their type info), and because importing `mercurial.ui` either directly or indirectly into `interfaces.repository` causes a situation where pytype stops inferring the type for `revlogutils.constants` that are imported by `revlog`. (Likely this is caused by a cycle. The `dirstate` interface already imports `scmutil`, which in turn imports `ui`, so the `repository` interface module importing the `dirstate` interface module as part of converting those classes to Protocol classes will trigger the issue.) I gave up on moving the class because `scmutil.status` depends on `stringutil`, which has a surprisingly long tail of dependencies. In any event, a standalone Protocol class might help with the Rust code.

Matt Harbison - - Load All Authors

File last commit:

r52755:607e94e0 default


                r53347:a1c0f19e

default

Download file

             charencode.py
        
                    87 lines
            
             | 2.4 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / pure / charencode.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      # charencode.py - miscellaneous character encoding

      #

      #  Copyright 2005-2009 Olivia Mackall <olivia@selenic.com> and others

      #

      # This software may be used and distributed according to the terms of the

      # GNU General Public License version 2 or any later version.

      from __future__ import annotations

      import array

      from .. import pycompat

      def isasciistr(s: bytes) -> bool:
          """Report whether ``s`` consists solely of ASCII bytes

          Returns True when ``s`` decodes cleanly as ASCII and False when the
          decode raises UnicodeDecodeError.
          """
          try:
              # The decoded text is discarded; only success or failure matters.
              s.decode('ascii')
          except UnicodeDecodeError:
              return False
          else:
              return True

      def asciilower(s: bytes) -> bytes:
          """Return the lowercase form of an ASCII-only byte string

          Raises UnicodeDecodeError if non-ASCII characters are found.
          """
          # Validation only: the decoded text itself is thrown away.
          s.decode('ascii')
          lowered = s.lower()
          return lowered

      def asciiupper(s: bytes) -> bytes:
          """Return the uppercase form of an ASCII-only byte string

          Raises UnicodeDecodeError if non-ASCII characters are found.
          """
          # Validation only: the decoded text itself is thrown away.
          s.decode('ascii')
          uppered = s.upper()
          return uppered

      # Lookup tables indexed by byte value; each entry is the JSON-escaped
      # bytes form of that value. Statement order matters below.
      _jsonmap = []

      # 0x00-0x1f: control characters default to the generic \uXXXX escape
      _jsonmap.extend(b"\\u%04x" % x for x in range(32))

      # 0x20-0x7e: entries come from pycompat.bytechr() (defined outside this
      # file; presumably the one-byte string for that value -- confirm there)
      _jsonmap.extend(pycompat.bytechr(x) for x in range(32, 127))

      # 0x7f is escaped too, bringing the table to 128 entries
      _jsonmap.append(b'\\u007f')

      # short escapes override the defaults installed above
      _jsonmap[0x09] = b'\\t'

      _jsonmap[0x0A] = b'\\n'

      _jsonmap[0x22] = b'\\"'

      _jsonmap[0x5C] = b'\\\\'

      _jsonmap[0x08] = b'\\b'

      _jsonmap[0x0C] = b'\\f'

      _jsonmap[0x0D] = b'\\r'

      # The paranoid table is copied while _jsonmap still has exactly 128
      # entries, so indexing it with a value >= 0x80 raises IndexError.
      _paranoidjsonmap = _jsonmap[:]

      _paranoidjsonmap[0x3C] = b'\\u003c'  # '<' (e.g. escape "</script>")

      _paranoidjsonmap[0x3E] = b'\\u003e'  # '>'

      # Only the non-paranoid table gets entries for 0x80-0xff.
      _jsonmap.extend(pycompat.bytechr(x) for x in range(128, 256))

      def jsonescapeu8fast(u8chars: bytes, paranoid: bool) -> bytes:
          """JSON-escape a UTF-8 byte string by per-byte table lookup (fast path)

          Every byte of ``u8chars`` is replaced by its entry in the escape table
          selected by ``paranoid`` and the pieces are concatenated.

          Raises ValueError if non-ASCII characters have to be escaped, i.e.
          when a byte has no entry in the selected table.
          """
          table = _paranoidjsonmap if paranoid else _jsonmap
          try:
              return b''.join(map(table.__getitem__, bytearray(u8chars)))
          except IndexError:
              # a byte value beyond the end of the selected table
              raise ValueError

      # codec error-handler name passed to both the UTF-8 decode and the UTF-16
      # encode in jsonescapeu8fallback()
      _utf8strict = r'surrogatepass'

      def jsonescapeu8fallback(u8chars: bytes, paranoid: bool) -> bytes:
          """JSON-escape a UTF-8 byte string via UTF-16 code units (slow path)

          Code units below 128 are looked up in the escape table selected by
          ``paranoid``; every other code unit is written as ``\\uXXXX``, so all
          non-ASCII characters are escaped no matter if paranoid is False.
          """
          table = _paranoidjsonmap if paranoid else _jsonmap

          # Going through UTF-16 turns each non-BMP character into a surrogate
          # pair, which is how it is then emitted.
          text = u8chars.decode('utf-8', _utf8strict)
          units = array.array('H', text.encode('utf-16', _utf8strict))
          del units[0]  # the leading code unit is the BOM

          pieces = []
          for unit in units:
              if unit < 128:
                  pieces.append(table[unit])
              else:
                  pieces.append(b'\\u%04x' % unit)
          return b''.join(pieces)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				# charencode.py - miscellaneous character encoding
				#
				# Copyright 2005-2009 Olivia Mackall <olivia@selenic.com> and others
				#
				# This software may be used and distributed according to the terms of the
				# GNU General Public License version 2 or any later version.

				from __future__ import annotations

				import array

				from .. import pycompat


				def isasciistr(s: bytes) -> bool:
				    """Report whether ``s`` consists solely of ASCII bytes

				    Returns True when ``s`` decodes cleanly as ASCII and False when the
				    decode raises UnicodeDecodeError.
				    """
				    try:
				        # The decoded text is discarded; only success or failure matters.
				        s.decode('ascii')
				        return True
				    except UnicodeDecodeError:
				        return False


				def asciilower(s: bytes) -> bytes:
				    """convert a string to lowercase if ASCII

				    Raises UnicodeDecodeError if non-ASCII characters are found."""
				    # Validation only: the decoded text itself is thrown away.
				    s.decode('ascii')
				    return s.lower()


				def asciiupper(s: bytes) -> bytes:
				    """convert a string to uppercase if ASCII

				    Raises UnicodeDecodeError if non-ASCII characters are found."""
				    # Validation only: the decoded text itself is thrown away.
				    s.decode('ascii')
				    return s.upper()


				# Lookup tables indexed by byte value; each entry is the JSON-escaped
				# bytes form of that value. Statement order matters below.
				_jsonmap = []
				# 0x00-0x1f: control characters default to the generic \uXXXX escape
				_jsonmap.extend(b"\\u%04x" % x for x in range(32))
				# 0x20-0x7e: entries come from pycompat.bytechr() (defined outside this
				# file; presumably the one-byte string for that value -- confirm there)
				_jsonmap.extend(pycompat.bytechr(x) for x in range(32, 127))
				# 0x7f is escaped too, bringing the table to 128 entries
				_jsonmap.append(b'\\u007f')
				# short escapes override the defaults installed above
				_jsonmap[0x09] = b'\\t'
				_jsonmap[0x0A] = b'\\n'
				_jsonmap[0x22] = b'\\"'
				_jsonmap[0x5C] = b'\\\\'
				_jsonmap[0x08] = b'\\b'
				_jsonmap[0x0C] = b'\\f'
				_jsonmap[0x0D] = b'\\r'
				# The paranoid table is copied while _jsonmap still has exactly 128
				# entries, so indexing it with a value >= 0x80 raises IndexError.
				_paranoidjsonmap = _jsonmap[:]
				_paranoidjsonmap[0x3C] = b'\\u003c' # '<' (e.g. escape "</script>")
				_paranoidjsonmap[0x3E] = b'\\u003e' # '>'
				# Only the non-paranoid table gets entries for 0x80-0xff.
				_jsonmap.extend(pycompat.bytechr(x) for x in range(128, 256))


				def jsonescapeu8fast(u8chars: bytes, paranoid: bool) -> bytes:
				    """Convert a UTF-8 byte string to JSON-escaped form (fast path)

				    Every byte of ``u8chars`` is replaced by its entry in the escape table
				    selected by ``paranoid`` and the pieces are concatenated.

				    Raises ValueError if non-ASCII characters have to be escaped.
				    """
				    if paranoid:
				        jm = _paranoidjsonmap
				    else:
				        jm = _jsonmap
				    try:
				        return b''.join(jm[x] for x in bytearray(u8chars))
				    except IndexError:
				        # a byte value beyond the end of the selected table
				        raise ValueError


				# codec error-handler name passed to both the UTF-8 decode and the UTF-16
				# encode in jsonescapeu8fallback()
				_utf8strict = r'surrogatepass'


				def jsonescapeu8fallback(u8chars: bytes, paranoid: bool) -> bytes:
				    """Convert a UTF-8 byte string to JSON-escaped form (slow path)

				    Code units below 128 are looked up in the escape table selected by
				    ``paranoid``; every other code unit is written as ``\\uXXXX``.

				    Escapes all non-ASCII characters no matter if paranoid is False.
				    """
				    if paranoid:
				        jm = _paranoidjsonmap
				    else:
				        jm = _jsonmap
				    # non-BMP char is represented as UTF-16 surrogate pair
				    u16b = u8chars.decode('utf-8', _utf8strict).encode('utf-16', _utf8strict)
				    u16codes = array.array('H', u16b)
				    u16codes.pop(0)  # drop BOM
				    return b''.join(jm[x] if x < 128 else b'\\u%04x' % x for x in u16codes)