upstream/mercurial-mirror Files · mercurial/thirdparty/tomli/_parser.py

rhg: ignore readonly FS error when saving dirstate...

rhg: ignore readonly FS error when saving dirstate. The error is already ignored when the .hg directory is read-only, so this is only fair (the Python hg is silent on a read-only filesystem, too).

Raphaël Gomès - - Load All Authors

File last commit:

r51654:2c34c9b6 default


                r52652:955084b4

stable

Download file

             _parser.py
        
                    663 lines
            
             | 21.1 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / thirdparty / tomli / _parser.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        Raphaël Gomès
    
thirdparty: vendor tomli...

              r51654
            
      import string

      from types import MappingProxyType

      from typing import Any, BinaryIO, Dict, FrozenSet, Iterable, NamedTuple, Optional, Tuple

      import warnings

      from ._re import (

          RE_DATETIME,

          RE_LOCALTIME,

          RE_NUMBER,

          match_to_datetime,

          match_to_localtime,

          match_to_number,

      )

      from ._types import Key, ParseFloat, Pos

      # Control characters: code points 0-31 plus DEL (127).
      ASCII_CTRL = frozenset(map(chr, range(32))) | {chr(127)}

      # None of the ILLEGAL_* sets below contains the quotation mark or the
      # backslash; the parser functions currently treat those as separate cases.
      ILLEGAL_BASIC_STR_CHARS = ASCII_CTRL - {"\t"}
      ILLEGAL_MULTILINE_BASIC_STR_CHARS = ASCII_CTRL - {"\t", "\n"}

      # Literal strings and comments reuse the basic-string sets.
      ILLEGAL_LITERAL_STR_CHARS = ILLEGAL_BASIC_STR_CHARS
      ILLEGAL_MULTILINE_LITERAL_STR_CHARS = ILLEGAL_MULTILINE_BASIC_STR_CHARS

      ILLEGAL_COMMENT_CHARS = ILLEGAL_BASIC_STR_CHARS

      TOML_WS = frozenset({" ", "\t"})
      TOML_WS_AND_NEWLINE = TOML_WS | {"\n"}
      BARE_KEY_CHARS = (
          frozenset(string.ascii_letters) | frozenset(string.digits) | {"-", "_"}
      )
      # A key may also start with either quote character (quoted keys).
      KEY_INITIAL_CHARS = BARE_KEY_CHARS | {'"', "'"}
      HEXDIGIT_CHARS = frozenset(string.hexdigits)

      # Maps a two-character escape sequence, as it appears in the source text,
      # to the single character it stands for.
      BASIC_STR_ESCAPE_REPLACEMENTS = MappingProxyType(
          {
              "\\b": "\u0008",  # backspace
              "\\t": "\u0009",  # tab
              "\\n": "\u000A",  # linefeed
              "\\f": "\u000C",  # form feed
              "\\r": "\u000D",  # carriage return
              '\\"': "\u0022",  # quote
              "\\\\": "\u005C",  # backslash
          }
      )

      class TOMLDecodeError(ValueError):
          """An error raised if a document is not valid TOML.

          Subclasses ``ValueError``. Within this module, instances are built by
          ``suffixed_err``, which appends the source coordinates to the message.
          """

      def load(fp: BinaryIO, *, parse_float: ParseFloat = float) -> Dict[str, Any]:
          """Read all of ``fp`` and parse the content as TOML.

          The payload returned by ``fp.read()`` is decoded with ``.decode()``.
          If it has no ``decode`` attribute (a text-mode file object), a
          ``DeprecationWarning`` is emitted and the payload is parsed as is.
          ``parse_float`` is forwarded to ``loads``.
          """
          payload = fp.read()
          try:
              text = payload.decode()
          except AttributeError:
              # No ``decode`` attribute: the file was opened in text mode.
              message = (
                  "Text file object support is deprecated in favor of binary file objects."
                  ' Use `open("foo.toml", "rb")` to open the file in binary mode.'
              )
              warnings.warn(message, DeprecationWarning, stacklevel=2)
              text = payload  # type: ignore[assignment]
          return loads(text, parse_float=parse_float)

      def loads(s: str, *, parse_float: ParseFloat = float) -> Dict[str, Any]:  # noqa: C901
          """Parse TOML from a string.

          The document is processed one statement at a time (typically one
          source line): an empty line, a comment, a key/value pair, a table
          header or an array-of-tables header. ``parse_float`` is forwarded to
          the key/value rule.

          Returns the plain ``dict`` that holds the parsed document.

          Raises ``TypeError`` if ``s`` is not a ``str``, and the
          ``TOMLDecodeError`` built by ``suffixed_err`` when a statement is
          invalid.
          """
          # The spec allows converting "\r\n" to "\n", even in string
          # literals. Let's do so to simplify parsing.
          try:
              src = s.replace("\r\n", "\n")
          except (AttributeError, TypeError):
              # bytes-like input raises TypeError here and objects without a
              # ``replace`` method raise AttributeError; report both uniformly.
              raise TypeError(
                  f"Expected str object, not '{type(s).__qualname__}'"
              ) from None
          pos = 0
          out = Output(NestedDict(), Flags())
          # Namespace of the most recent table / array-of-tables header.
          header: Key = ()

          # Parse one statement at a time
          # (typically means one line in TOML source)
          while True:
              # 1. Skip line leading whitespace
              pos = skip_chars(src, pos, TOML_WS)

              # 2. Parse rules. Expect one of the following:
              #    - end of file
              #    - end of line
              #    - comment
              #    - key/value pair
              #    - append dict to list (and move to its namespace)
              #    - create dict (and move to its namespace)
              # Skip trailing whitespace when applicable.
              try:
                  char = src[pos]
              except IndexError:
                  break
              if char == "\n":
                  pos += 1
                  continue
              if char in KEY_INITIAL_CHARS:
                  pos = key_value_rule(src, pos, out, header, parse_float)
                  pos = skip_chars(src, pos, TOML_WS)
              elif char == "[":
                  try:
                      second_char: Optional[str] = src[pos + 1]
                  except IndexError:
                      second_char = None
                  # "[[" opens an array of tables, a single "[" a table.
                  if second_char == "[":
                      pos, header = create_list_rule(src, pos, out)
                  else:
                      pos, header = create_dict_rule(src, pos, out)
                  pos = skip_chars(src, pos, TOML_WS)
              elif char != "#":
                  raise suffixed_err(src, pos, "Invalid statement")

              # 3. Skip comment
              pos = skip_comment(src, pos)

              # 4. Expect end of line or end of file
              try:
                  char = src[pos]
              except IndexError:
                  break
              if char != "\n":
                  raise suffixed_err(
                      src, pos, "Expected newline or end of document after a statement"
                  )
              pos += 1

          return out.data.dict

      class Flags:
          """Flags that map to parsed keys/namespaces.

          Flags live in a tree of entries keyed by key part. Every entry holds
          the flags of that exact key ("flags"), the flags that also cover all
          keys below it ("recursive_flags") and its child entries ("nested").
          """

          # Marks an immutable namespace (inline array or inline table).
          FROZEN = 0
          # Marks a nest that has been explicitly created and can no longer
          # be opened using the "[table]" syntax.
          EXPLICIT_NEST = 1

          def __init__(self) -> None:
              self._flags: Dict[str, dict] = {}

          @staticmethod
          def _blank_entry() -> dict:
              """Return a fresh entry carrying no flags and no children."""
              return {"flags": set(), "recursive_flags": set(), "nested": {}}

          def unset_all(self, key: Key) -> None:
              """Drop the entry of ``key`` (and with it everything nested below)."""
              level = self._flags
              for part in key[:-1]:
                  entry = level.get(part)
                  if entry is None:
                      # The parent path was never flagged: nothing to remove.
                      return
                  level = entry["nested"]
              level.pop(key[-1], None)

          def set_for_relative_key(self, head_key: Key, rel_key: Key, flag: int) -> None:
              """Add ``flag`` to every prefix of ``rel_key`` rooted at ``head_key``.

              Entries along ``head_key`` are created when missing but receive no
              flag themselves.
              """
              level = self._flags
              for part in head_key:
                  level = level.setdefault(part, self._blank_entry())["nested"]
              for part in rel_key:
                  entry = level.setdefault(part, self._blank_entry())
                  entry["flags"].add(flag)
                  level = entry["nested"]

          def set(self, key: Key, flag: int, *, recursive: bool) -> None:  # noqa: A003
              """Add ``flag`` to ``key``; with ``recursive`` it also covers sub-keys."""
              parents, stem = key[:-1], key[-1]
              level = self._flags
              for part in parents:
                  level = level.setdefault(part, self._blank_entry())["nested"]
              entry = level.setdefault(stem, self._blank_entry())
              bucket = "recursive_flags" if recursive else "flags"
              entry[bucket].add(flag)

          def is_(self, key: Key, flag: int) -> bool:
              """Tell whether ``flag`` applies to ``key``.

              It applies when set on ``key`` itself (either kind) or recursively
              on any ancestor of ``key``.
              """
              if not key:
                  return False  # document root has no flags
              level = self._flags
              for part in key[:-1]:
                  entry = level.get(part)
                  if entry is None:
                      return False
                  if flag in entry["recursive_flags"]:
                      return True
                  level = entry["nested"]
              leaf = level.get(key[-1])
              if leaf is None:
                  return False
              return flag in leaf["flags"] or flag in leaf["recursive_flags"]

      class NestedDict:
          """Wrapper around the result ``dict`` with helpers for nested access."""

          def __init__(self) -> None:
              # The parsed content of the TOML document
              self.dict: Dict[str, Any] = {}

          def get_or_create_nest(
              self,
              key: Key,
              *,
              access_lists: bool = True,
          ) -> dict:
              """Return the dict found at ``key``, creating missing levels.

              With ``access_lists`` a list met on the way is entered through its
              last item. ``KeyError`` is raised when a step lands on something
              that is not a dict.
              """
              node: Any = self.dict
              for part in key:
                  node = node.setdefault(part, {})
                  if access_lists and isinstance(node, list):
                      node = node[-1]
                  if not isinstance(node, dict):
                      raise KeyError("There is no nest behind this key")
              return node

          def append_nest_to_list(self, key: Key) -> None:
              """Append an empty dict to the list at ``key``, creating the list.

              ``KeyError`` is raised when the existing value cannot be appended to.
              """
              parent = self.get_or_create_nest(key[:-1])
              stem = key[-1]
              if stem not in parent:
                  parent[stem] = [{}]
                  return
              existing = parent[stem]
              try:
                  existing.append({})
              except AttributeError:
                  raise KeyError("An object other than list found behind this key")

      class Output(NamedTuple):
          # Parse state handed to the statement rules: ``loads`` builds one
          # instance and passes it to the key/value, table and array rules.

          # The document content built so far.
          data: NestedDict
          # Flags recorded for the keys/namespaces seen so far.
          flags: Flags

      def skip_chars(src: str, pos: Pos, chars: Iterable[str]) -> Pos:
          """Advance ``pos`` past every consecutive character found in ``chars``.

          Returns the index of the first character not in ``chars``; running off
          the end of ``src`` simply stops the scan.
          """
          try:
              while True:
                  if src[pos] not in chars:
                      return pos
                  pos += 1
          except IndexError:
              # Reached the end of the document.
              return pos

      def skip_until(
          src: str,
          pos: Pos,
          expect: str,
          *,
          error_on: FrozenSet[str],
          error_on_eof: bool,
      ) -> Pos:
          """Return the index of the next occurrence of ``expect`` at or after ``pos``.

          When ``expect`` does not occur, the end of ``src`` is returned unless
          ``error_on_eof`` is set, in which case an error is raised. An error is
          also raised, pointing at the first offender, when any character of
          ``error_on`` lies in the skipped span.
          """
          try:
              stop = src.index(expect, pos)
          except ValueError:
              stop = len(src)
              if error_on_eof:
                  raise suffixed_err(src, stop, f"Expected {expect!r}") from None

          skipped = src[pos:stop]
          if error_on.isdisjoint(skipped):
              return stop
          # Locate the first forbidden character for the error coordinates.
          bad_pos = pos + next(
              offset for offset, char in enumerate(skipped) if char in error_on
          )
          raise suffixed_err(src, bad_pos, f"Found invalid character {src[bad_pos]!r}")

      def skip_comment(src: str, pos: Pos) -> Pos:
          """Skip a comment starting at ``pos``, if there is one.

          When ``src`` has a "#" at ``pos``, the position of the following
          newline (or the end of the document) is returned; otherwise ``pos``
          is returned unchanged.
          """
          if not src.startswith("#", pos):
              return pos
          return skip_until(
              src, pos + 1, "\n", error_on=ILLEGAL_COMMENT_CHARS, error_on_eof=False
          )

      def skip_comments_and_array_ws(src: str, pos: Pos) -> Pos:
          """Skip any mix of whitespace, newlines and comments starting at ``pos``."""
          while True:
              advanced = skip_comment(src, skip_chars(src, pos, TOML_WS_AND_NEWLINE))
              if advanced == pos:
                  # Neither whitespace nor a comment was consumed this round.
                  return advanced
              pos = advanced

      def create_dict_rule(src: str, pos: Pos, out: Output) -> Tuple[Pos, Key]:
          """Handle a table header statement.

          Returns the position just past the closing "]" together with the
          parsed key.
          """
          # Step over "[" and any whitespace in front of the key.
          pos, key = parse_key(src, skip_chars(src, pos + 1, TOML_WS))

          flags = out.flags
          if flags.is_(key, Flags.EXPLICIT_NEST) or flags.is_(key, Flags.FROZEN):
              raise suffixed_err(src, pos, f"Can not declare {key} twice")
          flags.set(key, Flags.EXPLICIT_NEST, recursive=False)
          try:
              out.data.get_or_create_nest(key)
          except KeyError:
              raise suffixed_err(src, pos, "Can not overwrite a value") from None

          if src[pos : pos + 1] != "]":
              raise suffixed_err(src, pos, 'Expected "]" at the end of a table declaration')
          return pos + 1, key

      def create_list_rule(src: str, pos: Pos, out: Output) -> Tuple[Pos, Key]:
          """Handle an array-of-tables header statement.

          Appends a new empty table to the list at the parsed key and returns
          the position just past the closing "]]" together with that key.
          """
          # Step over "[[" and any whitespace in front of the key.
          pos, key = parse_key(src, skip_chars(src, pos + 2, TOML_WS))

          flags = out.flags
          if flags.is_(key, Flags.FROZEN):
              raise suffixed_err(src, pos, f"Can not mutate immutable namespace {key}")
          # Free the namespace now that it points to another empty list item...
          flags.unset_all(key)
          # ...but this key precisely is still prohibited from table declaration
          flags.set(key, Flags.EXPLICIT_NEST, recursive=False)
          try:
              out.data.append_nest_to_list(key)
          except KeyError:
              raise suffixed_err(src, pos, "Can not overwrite a value") from None

          if src[pos : pos + 2] != "]]":
              raise suffixed_err(src, pos, 'Expected "]]" at the end of an array declaration')
          return pos + 2, key

      def key_value_rule(
          src: str, pos: Pos, out: Output, header: Key, parse_float: ParseFloat
      ) -> Pos:
          """Parse one key/value statement and store it below ``header``.

          Returns the position just past the value.
          """
          pos, key, value = parse_key_value_pair(src, pos, parse_float)
          relative_parent, leaf = key[:-1], key[-1]
          namespace = header + relative_parent

          if out.flags.is_(namespace, Flags.FROZEN):
              raise suffixed_err(
                  src, pos, f"Can not mutate immutable namespace {namespace}"
              )
          # Containers in the relative path can't be opened with the table syntax after this
          out.flags.set_for_relative_key(header, key, Flags.EXPLICIT_NEST)

          try:
              table = out.data.get_or_create_nest(namespace)
          except KeyError:
              raise suffixed_err(src, pos, "Can not overwrite a value") from None
          if leaf in table:
              raise suffixed_err(src, pos, "Can not overwrite a value")

          # Mark inline table and array namespaces recursively immutable
          if isinstance(value, (dict, list)):
              out.flags.set(header + key, Flags.FROZEN, recursive=True)
          table[leaf] = value
          return pos

      def parse_key_value_pair(
          src: str, pos: Pos, parse_float: ParseFloat
      ) -> Tuple[Pos, Key, Any]:
          """Parse ``key = value`` at ``pos``.

          Returns the position past the value, the key and the parsed value.
          """
          pos, key = parse_key(src, pos)
          # An empty slice (end of document) also fails this comparison.
          if src[pos : pos + 1] != "=":
              raise suffixed_err(src, pos, 'Expected "=" after a key in a key/value pair')
          value_start = skip_chars(src, pos + 1, TOML_WS)
          pos, value = parse_value(src, value_start, parse_float)
          return pos, key, value

      def parse_key(src: str, pos: Pos) -> Tuple[Pos, Key]:
          """Parse a possibly dotted key into a tuple of its parts.

          Whitespace around the dots and after the last part is consumed; the
          returned position points at the first character after it.
          """
          pos, first_part = parse_key_part(src, pos)
          parts = [first_part]
          pos = skip_chars(src, pos, TOML_WS)
          # Every "." introduces one more key part.
          while src.startswith(".", pos):
              pos = skip_chars(src, pos + 1, TOML_WS)
              pos, next_part = parse_key_part(src, pos)
              parts.append(next_part)
              pos = skip_chars(src, pos, TOML_WS)
          return pos, tuple(parts)

      def parse_key_part(src: str, pos: Pos) -> Tuple[Pos, str]:
          """Parse one key part: a bare key, a literal string or a basic string."""
          lead = src[pos : pos + 1]  # empty at end of document
          if lead == "'":
              return parse_literal_str(src, pos)
          if lead == '"':
              return parse_one_line_basic_str(src, pos)
          if lead in BARE_KEY_CHARS:
              end = skip_chars(src, pos, BARE_KEY_CHARS)
              return end, src[pos:end]
          raise suffixed_err(src, pos, "Invalid initial character for a key part")

      def parse_one_line_basic_str(src: str, pos: Pos) -> Tuple[Pos, str]:
          """Parse a single-line basic string whose opening quote is at ``pos``."""
          # Step over the opening quote before handing over to the shared parser.
          return parse_basic_str(src, pos + 1, multiline=False)

      def parse_array(src: str, pos: Pos, parse_float: ParseFloat) -> Tuple[Pos, list]:
          """Parse an array whose opening "[" is at ``pos``.

          Returns the position past the closing "]" and the list of values. A
          trailing comma before the closing bracket is accepted.
          """
          items: list = []
          pos = skip_comments_and_array_ws(src, pos + 1)
          # The loop test covers both the empty array and a trailing comma.
          while not src.startswith("]", pos):
              pos, item = parse_value(src, pos, parse_float)
              items.append(item)
              pos = skip_comments_and_array_ws(src, pos)

              separator = src[pos : pos + 1]
              if separator == "]":
                  break
              if separator != ",":
                  raise suffixed_err(src, pos, "Unclosed array")
              pos = skip_comments_and_array_ws(src, pos + 1)
          return pos + 1, items

      def parse_inline_table(src: str, pos: Pos, parse_float: ParseFloat) -> Tuple[Pos, dict]:
          """Parse an inline table whose opening "{" is at ``pos``.

          Returns the position past the closing "}" and the resulting dict.
          """
          table = NestedDict()
          frozen = Flags()

          pos = skip_chars(src, pos + 1, TOML_WS)
          if src.startswith("}", pos):
              return pos + 1, table.dict
          while True:
              pos, key, value = parse_key_value_pair(src, pos, parse_float)
              parent_key, leaf = key[:-1], key[-1]
              if frozen.is_(key, Flags.FROZEN):
                  raise suffixed_err(src, pos, f"Can not mutate immutable namespace {key}")
              try:
                  nest = table.get_or_create_nest(parent_key, access_lists=False)
              except KeyError:
                  raise suffixed_err(src, pos, "Can not overwrite a value") from None
              if leaf in nest:
                  raise suffixed_err(src, pos, f"Duplicate inline table key {leaf!r}")
              nest[leaf] = value

              pos = skip_chars(src, pos, TOML_WS)
              terminator = src[pos : pos + 1]
              if terminator == "}":
                  return pos + 1, table.dict
              if terminator != ",":
                  raise suffixed_err(src, pos, "Unclosed inline table")
              # Nested containers may not be extended by later pairs.
              if isinstance(value, (dict, list)):
                  frozen.set(key, Flags.FROZEN, recursive=True)
              pos = skip_chars(src, pos + 1, TOML_WS)

      def parse_basic_str_escape(  # noqa: C901
          src: str, pos: Pos, *, multiline: bool = False
      ) -> Tuple[Pos, str]:
          """Parse the escape sequence whose backslash is at ``pos``.

          Returns the position past the sequence and the text it stands for. In
          multiline mode a backslash followed by a space, tab or newline trims
          the whitespace that follows and yields an empty string.
          """
          escape_id = src[pos : pos + 2]
          after = pos + 2
          if multiline and escape_id in ("\\ ", "\\\t", "\\\n"):
              # Skip whitespace until next non-whitespace character or end of
              # the doc. Error if non-whitespace is found before newline.
              if escape_id != "\\\n":
                  after = skip_chars(src, after, TOML_WS)
                  try:
                      following = src[after]
                  except IndexError:
                      return after, ""
                  if following != "\n":
                      raise suffixed_err(src, after, 'Unescaped "\\" in a string')
                  after += 1
              return skip_chars(src, after, TOML_WS_AND_NEWLINE), ""

          # Unicode escapes: four hex digits for "u", eight for "U".
          if escape_id == "\\u":
              return parse_hex_char(src, after, 4)
          if escape_id == "\\U":
              return parse_hex_char(src, after, 8)

          try:
              replacement = BASIC_STR_ESCAPE_REPLACEMENTS[escape_id]
          except KeyError:
              # A short slice means the document ended right after the backslash.
              if len(escape_id) != 2:
                  raise suffixed_err(src, after, "Unterminated string") from None
              raise suffixed_err(src, after, 'Unescaped "\\" in a string') from None
          return after, replacement

      def parse_basic_str_escape_multiline(src: str, pos: Pos) -> Tuple[Pos, str]:
          """Parse an escape sequence using the multiline basic string rules."""
          result = parse_basic_str_escape(src, pos, multiline=True)
          return result

      def parse_hex_char(src: str, pos: Pos, hex_len: int) -> Tuple[Pos, str]:
          """Parse ``hex_len`` hexadecimal digits at ``pos`` into one character.

          Returns the position past the digits and the decoded character.
          """
          end = pos + hex_len
          digits = src[pos:end]
          # A short slice means the document ended inside the escape.
          if len(digits) != hex_len or not HEXDIGIT_CHARS.issuperset(digits):
              raise suffixed_err(src, pos, "Invalid hex value")
          codepoint = int(digits, 16)
          if not is_unicode_scalar_value(codepoint):
              raise suffixed_err(src, end, "Escaped character is not a Unicode scalar value")
          return end, chr(codepoint)

      def parse_literal_str(src: str, pos: Pos) -> Tuple[Pos, str]:
          """Parse a single-line literal string whose opening apostrophe is at ``pos``.

          Returns the position past the closing apostrophe and the raw content.
          """
          content_start = pos + 1  # Skip starting apostrophe
          closing = skip_until(
              src,
              content_start,
              "'",
              error_on=ILLEGAL_LITERAL_STR_CHARS,
              error_on_eof=True,
          )
          # Skip ending apostrophe
          return closing + 1, src[content_start:closing]

      def parse_multiline_str(src: str, pos: Pos, *, literal: bool) -> Tuple[Pos, str]:
          """Parse a multiline string whose opening triple delimiter is at ``pos``.

          ``literal`` selects the apostrophe-delimited form over the
          quote-delimited one. A newline directly after the opening delimiter
          is dropped. Returns the position past the string and its content.
          """
          pos += 3
          if src[pos : pos + 1] == "\n":
              pos += 1

          if literal:
              delim = "'"
              closing = skip_until(
                  src,
                  pos,
                  "'''",
                  error_on=ILLEGAL_MULTILINE_LITERAL_STR_CHARS,
                  error_on_eof=True,
              )
              result = src[pos:closing]
              pos = closing + 3
          else:
              delim = '"'
              pos, result = parse_basic_str(src, pos, multiline=True)

          # Add at maximum two extra apostrophes/quotes if the end sequence
          # is 4 or 5 chars long instead of just 3.
          extra = 0
          while extra < 2 and src.startswith(delim, pos + extra):
              extra += 1
          return pos + extra, result + delim * extra

      def parse_basic_str(src: str, pos: Pos, *, multiline: bool) -> Tuple[Pos, str]:
          """Parse the body of a basic string starting at ``pos``.

          ``pos`` must already be past the opening delimiter. Returns the
          position past the closing delimiter and the content with escape
          sequences replaced.
          """
          if multiline:
              error_on = ILLEGAL_MULTILINE_BASIC_STR_CHARS
              parse_escapes = parse_basic_str_escape_multiline
          else:
              error_on = ILLEGAL_BASIC_STR_CHARS
              parse_escapes = parse_basic_str_escape

          pieces = []  # finished chunks: raw text and decoded escapes
          chunk_start = pos
          while True:
              if pos >= len(src):
                  raise suffixed_err(src, pos, "Unterminated string")
              char = src[pos]
              if char == '"':
                  if not multiline:
                      return pos + 1, "".join(pieces) + src[chunk_start:pos]
                  if src.startswith('"""', pos):
                      return pos + 3, "".join(pieces) + src[chunk_start:pos]
                  # A lone quote inside a multiline string is ordinary content.
                  pos += 1
              elif char == "\\":
                  pieces.append(src[chunk_start:pos])
                  pos, unescaped = parse_escapes(src, pos)
                  pieces.append(unescaped)
                  chunk_start = pos
              elif char in error_on:
                  raise suffixed_err(src, pos, f"Illegal character {char!r}")
              else:
                  pos += 1

      def parse_value(  # noqa: C901
          src: str, pos: Pos, parse_float: ParseFloat
      ) -> Tuple[Pos, Any]:
          """Parse the value starting at ``pos``.

          Candidates are tried in a fixed order: strings, booleans, dates and
          times, numbers, arrays, inline tables and finally the special floats.
          Returns the position past the value and the parsed object.
          """
          lead = src[pos : pos + 1]  # empty at end of document

          # Basic strings
          if lead == '"':
              if src.startswith('"""', pos):
                  return parse_multiline_str(src, pos, literal=False)
              return parse_one_line_basic_str(src, pos)

          # Literal strings
          if lead == "'":
              if src.startswith("'''", pos):
                  return parse_multiline_str(src, pos, literal=True)
              return parse_literal_str(src, pos)

          # Booleans
          if src.startswith("true", pos):
              return pos + 4, True
          if src.startswith("false", pos):
              return pos + 5, False

          # Dates and times
          datetime_match = RE_DATETIME.match(src, pos)
          if datetime_match:
              try:
                  parsed_datetime = match_to_datetime(datetime_match)
              except ValueError as e:
                  raise suffixed_err(src, pos, "Invalid date or datetime") from e
              return datetime_match.end(), parsed_datetime
          localtime_match = RE_LOCALTIME.match(src, pos)
          if localtime_match:
              return localtime_match.end(), match_to_localtime(localtime_match)

          # Integers and "normal" floats.
          # The regex will greedily match any type starting with a decimal
          # char, so needs to be located after handling of dates and times.
          number_match = RE_NUMBER.match(src, pos)
          if number_match:
              return number_match.end(), match_to_number(number_match, parse_float)

          # Arrays
          if lead == "[":
              return parse_array(src, pos, parse_float)

          # Inline tables
          if lead == "{":
              return parse_inline_table(src, pos, parse_float)

          # Special floats: unsigned spellings first, then the signed ones.
          for token in ("inf", "nan", "-inf", "+inf", "-nan", "+nan"):
              if src.startswith(token, pos):
                  return pos + len(token), parse_float(token)

          raise suffixed_err(src, pos, "Invalid value")

      def suffixed_err(src: str, pos: Pos, msg: str) -> TOMLDecodeError:
          """Build a `TOMLDecodeError` whose message ends with the coordinates
          of ``pos`` in ``src``. The exception is returned, not raised."""
          if pos >= len(src):
              location = "end of document"
          else:
              line = src.count("\n", 0, pos) + 1
              # ``rfind`` yields -1 on the first line, which makes the column
              # ``pos + 1``; on later lines it is the distance to the last newline.
              column = pos - src.rfind("\n", 0, pos)
              location = f"line {line}, column {column}"
          return TOMLDecodeError(f"{msg} (at {location})")

      def is_unicode_scalar_value(codepoint: int) -> bool:
          """Tell whether ``codepoint`` lies in 0-0x10FFFF outside 0xD800-0xDFFF."""
          if not 0 <= codepoint <= 0x10FFFF:
              return False
          return not 0xD800 <= codepoint <= 0xDFFF

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

Raphaël Gomès thirdparty: vendor tomli...	r51654	import string
		from types import MappingProxyType
		from typing import Any, BinaryIO, Dict, FrozenSet, Iterable, NamedTuple, Optional, Tuple
		import warnings

		from ._re import (
		RE_DATETIME,
		RE_LOCALTIME,
		RE_NUMBER,
		match_to_datetime,
		match_to_localtime,
		match_to_number,
		)
		from ._types import Key, ParseFloat, Pos

		# Control characters: code points 0-31 plus DEL (127).
		ASCII_CTRL = frozenset(chr(i) for i in range(32)) | frozenset(chr(127))

		# Neither of these sets include quotation mark or backslash. They are
		# currently handled as separate cases in the parser functions.
		ILLEGAL_BASIC_STR_CHARS = ASCII_CTRL - frozenset("\t")
		ILLEGAL_MULTILINE_BASIC_STR_CHARS = ASCII_CTRL - frozenset("\t\n")

		# Literal strings and comments reuse the basic-string sets.
		ILLEGAL_LITERAL_STR_CHARS = ILLEGAL_BASIC_STR_CHARS
		ILLEGAL_MULTILINE_LITERAL_STR_CHARS = ILLEGAL_MULTILINE_BASIC_STR_CHARS

		ILLEGAL_COMMENT_CHARS = ILLEGAL_BASIC_STR_CHARS

		TOML_WS = frozenset(" \t")
		TOML_WS_AND_NEWLINE = TOML_WS | frozenset("\n")
		BARE_KEY_CHARS = frozenset(string.ascii_letters + string.digits + "-_")
		# A key may also start with either quote character (quoted keys).
		KEY_INITIAL_CHARS = BARE_KEY_CHARS | frozenset("\"'")
		HEXDIGIT_CHARS = frozenset(string.hexdigits)

		# Maps a two-character escape sequence, as it appears in the source text,
		# to the single character it stands for.
		BASIC_STR_ESCAPE_REPLACEMENTS = MappingProxyType(
		    {
		        "\\b": "\u0008",  # backspace
		        "\\t": "\u0009",  # tab
		        "\\n": "\u000A",  # linefeed
		        "\\f": "\u000C",  # form feed
		        "\\r": "\u000D",  # carriage return
		        '\\"': "\u0022",  # quote
		        "\\\\": "\u005C",  # backslash
		    }
		)


		class TOMLDecodeError(ValueError):
		    """An error raised if a document is not valid TOML."""


		def load(fp: BinaryIO, *, parse_float: ParseFloat = float) -> Dict[str, Any]:
		    """Parse TOML from a binary file object.

		    The payload returned by ``fp.read()`` is decoded with ``.decode()``.
		    If it has no ``decode`` attribute (a text-mode file object), a
		    ``DeprecationWarning`` is emitted and the payload is parsed as is.
		    ``parse_float`` is forwarded to ``loads``.
		    """
		    s_bytes = fp.read()
		    try:
		        s = s_bytes.decode()
		    except AttributeError:
		        # No ``decode`` attribute: the file was opened in text mode.
		        warnings.warn(
		            "Text file object support is deprecated in favor of binary file objects."
		            ' Use `open("foo.toml", "rb")` to open the file in binary mode.',
		            DeprecationWarning,
		            stacklevel=2,
		        )
		        s = s_bytes  # type: ignore[assignment]
		    return loads(s, parse_float=parse_float)


		def loads(s: str, *, parse_float: ParseFloat = float) -> Dict[str, Any]:  # noqa: C901
		    """Parse TOML from a string.

		    The document is processed one statement at a time (typically one
		    source line). ``parse_float`` is forwarded to the key/value rule.

		    Returns the plain ``dict`` that holds the parsed document.

		    Raises ``TypeError`` if ``s`` is not a ``str``, and the
		    ``TOMLDecodeError`` built by ``suffixed_err`` when a statement is
		    invalid.
		    """
		    # The spec allows converting "\r\n" to "\n", even in string
		    # literals. Let's do so to simplify parsing.
		    try:
		        src = s.replace("\r\n", "\n")
		    except (AttributeError, TypeError):
		        # bytes-like input raises TypeError here and objects without a
		        # ``replace`` method raise AttributeError; report both uniformly.
		        raise TypeError(
		            f"Expected str object, not '{type(s).__qualname__}'"
		        ) from None
		    pos = 0
		    out = Output(NestedDict(), Flags())
		    # Namespace of the most recent table / array-of-tables header.
		    header: Key = ()

		    # Parse one statement at a time
		    # (typically means one line in TOML source)
		    while True:
		        # 1. Skip line leading whitespace
		        pos = skip_chars(src, pos, TOML_WS)

		        # 2. Parse rules. Expect one of the following:
		        #    - end of file
		        #    - end of line
		        #    - comment
		        #    - key/value pair
		        #    - append dict to list (and move to its namespace)
		        #    - create dict (and move to its namespace)
		        # Skip trailing whitespace when applicable.
		        try:
		            char = src[pos]
		        except IndexError:
		            break
		        if char == "\n":
		            pos += 1
		            continue
		        if char in KEY_INITIAL_CHARS:
		            pos = key_value_rule(src, pos, out, header, parse_float)
		            pos = skip_chars(src, pos, TOML_WS)
		        elif char == "[":
		            try:
		                second_char: Optional[str] = src[pos + 1]
		            except IndexError:
		                second_char = None
		            # "[[" opens an array of tables, a single "[" a table.
		            if second_char == "[":
		                pos, header = create_list_rule(src, pos, out)
		            else:
		                pos, header = create_dict_rule(src, pos, out)
		            pos = skip_chars(src, pos, TOML_WS)
		        elif char != "#":
		            raise suffixed_err(src, pos, "Invalid statement")

		        # 3. Skip comment
		        pos = skip_comment(src, pos)

		        # 4. Expect end of line or end of file
		        try:
		            char = src[pos]
		        except IndexError:
		            break
		        if char != "\n":
		            raise suffixed_err(
		                src, pos, "Expected newline or end of document after a statement"
		            )
		        pos += 1

		    return out.data.dict


		class Flags:
		    """Flags that map to parsed keys/namespaces.

		    Flags live in a tree of entries keyed by key part. Every entry holds
		    the flags of that exact key ("flags"), the flags that also cover all
		    keys below it ("recursive_flags") and its child entries ("nested").
		    """

		    # Marks an immutable namespace (inline array or inline table).
		    FROZEN = 0
		    # Marks a nest that has been explicitly created and can no longer
		    # be opened using the "[table]" syntax.
		    EXPLICIT_NEST = 1

		    def __init__(self) -> None:
		        self._flags: Dict[str, dict] = {}

		    def unset_all(self, key: Key) -> None:
		        """Drop the entry of ``key`` (and with it everything nested below)."""
		        cont = self._flags
		        for k in key[:-1]:
		            if k not in cont:
		                # The parent path was never flagged: nothing to remove.
		                return
		            cont = cont[k]["nested"]
		        cont.pop(key[-1], None)

		    def set_for_relative_key(self, head_key: Key, rel_key: Key, flag: int) -> None:
		        """Add ``flag`` to every prefix of ``rel_key`` rooted at ``head_key``.

		        Entries along ``head_key`` are created when missing but receive no
		        flag themselves.
		        """
		        cont = self._flags
		        for k in head_key:
		            if k not in cont:
		                cont[k] = {"flags": set(), "recursive_flags": set(), "nested": {}}
		            cont = cont[k]["nested"]
		        for k in rel_key:
		            if k in cont:
		                cont[k]["flags"].add(flag)
		            else:
		                cont[k] = {"flags": {flag}, "recursive_flags": set(), "nested": {}}
		            cont = cont[k]["nested"]

		    def set(self, key: Key, flag: int, *, recursive: bool) -> None:  # noqa: A003
		        """Add ``flag`` to ``key``; with ``recursive`` it also covers sub-keys."""
		        cont = self._flags
		        key_parent, key_stem = key[:-1], key[-1]
		        for k in key_parent:
		            if k not in cont:
		                cont[k] = {"flags": set(), "recursive_flags": set(), "nested": {}}
		            cont = cont[k]["nested"]
		        if key_stem not in cont:
		            cont[key_stem] = {"flags": set(), "recursive_flags": set(), "nested": {}}
		        cont[key_stem]["recursive_flags" if recursive else "flags"].add(flag)

		    def is_(self, key: Key, flag: int) -> bool:
		        """Tell whether ``flag`` applies to ``key``.

		        It applies when set on ``key`` itself (either kind) or recursively
		        on any ancestor of ``key``.
		        """
		        if not key:
		            return False  # document root has no flags
		        cont = self._flags
		        for k in key[:-1]:
		            if k not in cont:
		                return False
		            inner_cont = cont[k]
		            if flag in inner_cont["recursive_flags"]:
		                return True
		            cont = inner_cont["nested"]
		        key_stem = key[-1]
		        if key_stem in cont:
		            cont = cont[key_stem]
		            return flag in cont["flags"] or flag in cont["recursive_flags"]
		        return False


		class NestedDict:
		    """Holder of the parsed document that creates nested tables on demand."""

		    def __init__(self) -> None:
		        # The parsed content of the TOML document
		        self.dict: Dict[str, Any] = {}

		    def get_or_create_nest(
		        self,
		        key: Key,
		        *,
		        access_lists: bool = True,
		    ) -> dict:
		        """Return the dict found behind `key`, creating missing levels.

		        When `access_lists` is true and a level holds a list, the walk
		        continues into the last item of that list.

		        Raises:
		            KeyError: a level of `key` holds something that is not a dict.
		        """
		        cont: Any = self.dict
		        for k in key:
		            if k not in cont:
		                cont[k] = {}
		            cont = cont[k]
		            if access_lists and isinstance(cont, list):
		                cont = cont[-1]
		            if not isinstance(cont, dict):
		                raise KeyError("There is no nest behind this key")
		        return cont

		    def append_nest_to_list(self, key: Key) -> None:
		        """Append an empty dict to the list behind `key`.

		        The list is created (holding one empty dict) when the last part of
		        `key` does not exist yet.

		        Raises:
		            KeyError: the value behind `key` exists but is not a list, or a
		                parent level does not hold a dict.
		        """
		        cont = self.get_or_create_nest(key[:-1])
		        last_key = key[-1]
		        if last_key not in cont:
		            cont[last_key] = [{}]
		            return
		        list_ = cont[last_key]
		        # Check the type explicitly instead of probing for an `append`
		        # attribute: a non-list value that merely has an `append` method
		        # must be rejected, not mutated.
		        if not isinstance(list_, list):
		            raise KeyError("An object other than list found behind this key")
		        list_.append({})


		class Output(NamedTuple):
		    """Pair of parse-state objects handed to the statement rules."""

		    # Holder of the nested dict of parsed values
		    data: NestedDict
		    # Markers recorded for the parsed keys/namespaces
		    flags: Flags


		def skip_chars(src: str, pos: Pos, chars: Iterable[str]) -> Pos:
		    """Return the first position at or after `pos` whose char is not in `chars`.

		    When every remaining character belongs to `chars`, the position just
		    past the end of `src` is returned.
		    """
		    try:
		        while True:
		            if src[pos] not in chars:
		                return pos
		            pos += 1
		    except IndexError:
		        # Walked off the end of the document.
		        return pos


		def skip_until(
		    src: str,
		    pos: Pos,
		    expect: str,
		    *,
		    error_on: FrozenSet[str],
		    error_on_eof: bool,
		) -> Pos:
		    """Return the position of the next `expect` at or after `pos`.

		    If `expect` does not occur, the end of `src` is used instead, unless
		    `error_on_eof` is set, in which case an error is raised. An error is
		    also raised when any character of `error_on` lies in the skipped
		    range; it is reported at the first such character.
		    """
		    new_pos = src.find(expect, pos)
		    if new_pos == -1:
		        new_pos = len(src)
		        if error_on_eof:
		            raise suffixed_err(src, new_pos, f"Expected {expect!r}") from None

		    if error_on.isdisjoint(src[pos:new_pos]):
		        return new_pos
		    # Only walk the range char by char once a forbidden char is known to exist.
		    bad_pos = next(i for i in range(pos, new_pos) if src[i] in error_on)
		    raise suffixed_err(src, bad_pos, f"Found invalid character {src[bad_pos]!r}")


		def skip_comment(src: str, pos: Pos) -> Pos:
		    """Skip a comment that starts at `pos`, if there is one.

		    Returns `pos` unchanged when the character at `pos` is not "#".
		    Otherwise returns the position of the newline that ends the comment,
		    or the end of `src` when there is no newline.
		    """
		    if not src.startswith("#", pos):
		        return pos
		    return skip_until(
		        src, pos + 1, "\n", error_on=ILLEGAL_COMMENT_CHARS, error_on_eof=False
		    )


		def skip_comments_and_array_ws(src: str, pos: Pos) -> Pos:
		    """Skip any mix of whitespace, newlines and comments starting at `pos`.

		    Repeats whitespace and comment skipping until a pass makes no progress.
		    """
		    while True:
		        advanced = skip_comment(src, skip_chars(src, pos, TOML_WS_AND_NEWLINE))
		        if advanced == pos:
		            return pos
		        pos = advanced


		def create_dict_rule(src: str, pos: Pos, out: Output) -> Tuple[Pos, Key]:
		    """Process a "[table]" declaration whose "[" is at `pos`.

		    Marks the table as explicitly created and makes sure its dict exists
		    in the output. Returns the position after the closing "]" together
		    with the table's key.
		    """
		    pos = skip_chars(src, pos + 1, TOML_WS)  # "+ 1" skips "["
		    pos, key = parse_key(src, pos)

		    flags = out.flags
		    declared = flags.is_(key, Flags.EXPLICIT_NEST) or flags.is_(key, Flags.FROZEN)
		    if declared:
		        raise suffixed_err(src, pos, f"Can not declare {key} twice")
		    flags.set(key, Flags.EXPLICIT_NEST, recursive=False)
		    try:
		        out.data.get_or_create_nest(key)
		    except KeyError:
		        raise suffixed_err(src, pos, "Can not overwrite a value") from None

		    if src.startswith("]", pos):
		        return pos + 1, key
		    raise suffixed_err(src, pos, 'Expected "]" at the end of a table declaration')


		def create_list_rule(src: str, pos: Pos, out: Output) -> Tuple[Pos, Key]:
		    """Process a "[[array]]" declaration whose "[[" is at `pos`.

		    Appends a new empty table to the array behind the key. Returns the
		    position after the closing "]]" together with the array's key.
		    """
		    pos = skip_chars(src, pos + 2, TOML_WS)  # "+ 2" skips "[["
		    pos, key = parse_key(src, pos)

		    flags = out.flags
		    if flags.is_(key, Flags.FROZEN):
		        raise suffixed_err(src, pos, f"Can not mutate immutable namespace {key}")
		    # The namespace now points at a brand new list item, so drop what was
		    # recorded for the previous one...
		    flags.unset_all(key)
		    # ...while this exact key stays off limits for table declarations.
		    flags.set(key, Flags.EXPLICIT_NEST, recursive=False)
		    try:
		        out.data.append_nest_to_list(key)
		    except KeyError:
		        raise suffixed_err(src, pos, "Can not overwrite a value") from None

		    if src.startswith("]]", pos):
		        return pos + 2, key
		    raise suffixed_err(src, pos, 'Expected "]]" at the end of an array declaration')


		def key_value_rule(
		    src: str, pos: Pos, out: Output, header: Key, parse_float: ParseFloat
		) -> Pos:
		    """Parse a key/value pair at `pos` and store it below table `header`.

		    Returns the position after the parsed value. Raises when the target
		    namespace is frozen or when the pair would overwrite an existing value.
		    """
		    pos, key, value = parse_key_value_pair(src, pos, parse_float)
		    abs_key = header + key
		    abs_key_parent = abs_key[:-1]
		    key_stem = key[-1]

		    if out.flags.is_(abs_key_parent, Flags.FROZEN):
		        raise suffixed_err(
		            src, pos, f"Can not mutate immutable namespace {abs_key_parent}"
		        )
		    # From now on the table syntax can't open containers on the relative path
		    out.flags.set_for_relative_key(header, key, Flags.EXPLICIT_NEST)
		    try:
		        nest = out.data.get_or_create_nest(abs_key_parent)
		    except KeyError:
		        raise suffixed_err(src, pos, "Can not overwrite a value") from None
		    if key_stem in nest:
		        raise suffixed_err(src, pos, "Can not overwrite a value")
		    # Inline tables and arrays become immutable, including all they contain
		    if isinstance(value, (dict, list)):
		        out.flags.set(abs_key, Flags.FROZEN, recursive=True)
		    nest[key_stem] = value
		    return pos


		def parse_key_value_pair(
		    src: str, pos: Pos, parse_float: ParseFloat
		) -> Tuple[Pos, Key, Any]:
		    """Parse `key = value` starting at `pos`.

		    Returns the position after the value, the (possibly dotted) key and
		    the parsed value.
		    """
		    pos, key = parse_key(src, pos)
		    if not src.startswith("=", pos):
		        raise suffixed_err(src, pos, 'Expected "=" after a key in a key/value pair')
		    value_start = skip_chars(src, pos + 1, TOML_WS)
		    end, value = parse_value(src, value_start, parse_float)
		    return end, key, value


		def parse_key(src: str, pos: Pos) -> Tuple[Pos, Key]:
		    """Parse a key made of one or more dot-separated parts.

		    Whitespace around the dots is skipped. Returns the position after the
		    key (and any whitespace following it) and the parts as a tuple.
		    """
		    pos, first_part = parse_key_part(src, pos)
		    parts = [first_part]
		    pos = skip_chars(src, pos, TOML_WS)
		    while src.startswith(".", pos):
		        pos = skip_chars(src, pos + 1, TOML_WS)
		        pos, next_part = parse_key_part(src, pos)
		        parts.append(next_part)
		        pos = skip_chars(src, pos, TOML_WS)
		    return pos, tuple(parts)


		def parse_key_part(src: str, pos: Pos) -> Tuple[Pos, str]:
		    """Parse one part of a key: bare, literal-quoted or basic-quoted.

		    Returns the position after the part and the part's text.
		    """
		    # None stands for "end of document"; it matches none of the cases below.
		    first: Optional[str] = src[pos] if pos < len(src) else None
		    if first in BARE_KEY_CHARS:
		        end = skip_chars(src, pos, BARE_KEY_CHARS)
		        return end, src[pos:end]
		    if first == "'":
		        return parse_literal_str(src, pos)
		    if first == '"':
		        return parse_one_line_basic_str(src, pos)
		    raise suffixed_err(src, pos, "Invalid initial character for a key part")


		def parse_one_line_basic_str(src: str, pos: Pos) -> Tuple[Pos, str]:
		    """Parse a single-line basic string whose opening quote is at `pos`."""
		    # "+ 1" steps over the opening quotation mark.
		    return parse_basic_str(src, pos + 1, multiline=False)


		def parse_array(src: str, pos: Pos, parse_float: ParseFloat) -> Tuple[Pos, list]:
		    """Parse an array whose "[" is at `pos`.

		    Whitespace, newlines and comments are allowed between items, and a
		    comma may follow the last item. Returns the position after the
		    closing "]" and the list of parsed values.
		    """
		    items: list = []
		    pos = skip_comments_and_array_ws(src, pos + 1)  # "+ 1" skips "["
		    # The loop condition covers both the empty array and a "]" that
		    # directly follows a trailing comma.
		    while not src.startswith("]", pos):
		        pos, item = parse_value(src, pos, parse_float)
		        items.append(item)
		        pos = skip_comments_and_array_ws(src, pos)

		        separator = src[pos : pos + 1]
		        if separator == "]":
		            break
		        if separator != ",":
		            raise suffixed_err(src, pos, "Unclosed array")
		        pos = skip_comments_and_array_ws(src, pos + 1)
		    return pos + 1, items


		def parse_inline_table(src: str, pos: Pos, parse_float: ParseFloat) -> Tuple[Pos, dict]:
		    """Parse an inline table whose "{" is at `pos`.

		    Returns the position after the closing "}" and the parsed dict.
		    """
		    table = NestedDict()
		    table_flags = Flags()

		    pos = skip_chars(src, pos + 1, TOML_WS)  # "+ 1" skips "{"
		    if src.startswith("}", pos):
		        return pos + 1, table.dict
		    while True:
		        pos, key, value = parse_key_value_pair(src, pos, parse_float)
		        parent, stem = key[:-1], key[-1]
		        if table_flags.is_(key, Flags.FROZEN):
		            raise suffixed_err(src, pos, f"Can not mutate immutable namespace {key}")
		        try:
		            nest = table.get_or_create_nest(parent, access_lists=False)
		        except KeyError:
		            raise suffixed_err(src, pos, "Can not overwrite a value") from None
		        if stem in nest:
		            raise suffixed_err(src, pos, f"Duplicate inline table key {stem!r}")
		        nest[stem] = value

		        pos = skip_chars(src, pos, TOML_WS)
		        separator = src[pos : pos + 1]
		        if separator == "}":
		            return pos + 1, table.dict
		        if separator != ",":
		            raise suffixed_err(src, pos, "Unclosed inline table")
		        # More pairs follow: a nested table/array value may not be
		        # extended by them.
		        if isinstance(value, (dict, list)):
		            table_flags.set(key, Flags.FROZEN, recursive=True)
		        pos = skip_chars(src, pos + 1, TOML_WS)


		def parse_basic_str_escape(  # noqa: C901
		    src: str, pos: Pos, *, multiline: bool = False
		) -> Tuple[Pos, str]:
		    """Parse the escape sequence whose backslash is at `pos`.

		    Returns the position after the sequence and the text it stands for.
		    In multiline mode a backslash followed by whitespace or a newline
		    stands for the empty string and swallows the whitespace and newlines
		    that follow.
		    """
		    escape_id = src[pos : pos + 2]
		    pos += 2

		    if multiline and escape_id in {"\\ ", "\\\t", "\\\n"}:
		        # Skip whitespace until next non-whitespace character or end of
		        # the doc. Error if non-whitespace is found before newline.
		        if escape_id != "\\\n":
		            pos = skip_chars(src, pos, TOML_WS)
		            if pos >= len(src):
		                return pos, ""
		            if src[pos] != "\n":
		                raise suffixed_err(src, pos, 'Unescaped "\\" in a string')
		            pos += 1
		        return skip_chars(src, pos, TOML_WS_AND_NEWLINE), ""

		    if escape_id == "\\u":
		        return parse_hex_char(src, pos, 4)
		    if escape_id == "\\U":
		        return parse_hex_char(src, pos, 8)

		    try:
		        replacement = BASIC_STR_ESCAPE_REPLACEMENTS[escape_id]
		    except KeyError:
		        # Fewer than two characters means the document ended right
		        # after the backslash.
		        if len(escape_id) == 2:
		            reason = 'Unescaped "\\" in a string'
		        else:
		            reason = "Unterminated string"
		        raise suffixed_err(src, pos, reason) from None
		    return pos, replacement


		def parse_basic_str_escape_multiline(src: str, pos: Pos) -> Tuple[Pos, str]:
		    """Parse an escape sequence at `pos` using the multiline-string rules.

		    Same as `parse_basic_str_escape` called with `multiline=True`.
		    """
		    return parse_basic_str_escape(src, pos, multiline=True)


		def parse_hex_char(src: str, pos: Pos, hex_len: int) -> Tuple[Pos, str]:
		    """Decode `hex_len` hex digits starting at `pos` into one character.

		    Returns the position after the digits and the decoded character.
		    """
		    end = pos + hex_len
		    digits = src[pos:end]
		    if not (len(digits) == hex_len and HEXDIGIT_CHARS.issuperset(digits)):
		        raise suffixed_err(src, pos, "Invalid hex value")
		    codepoint = int(digits, 16)
		    if not is_unicode_scalar_value(codepoint):
		        # This error is reported at the position after the digits.
		        raise suffixed_err(src, end, "Escaped character is not a Unicode scalar value")
		    return end, chr(codepoint)


		def parse_literal_str(src: str, pos: Pos) -> Tuple[Pos, str]:
		    """Parse a single-line literal string whose opening "'" is at `pos`.

		    Returns the position after the closing apostrophe and the text
		    between the apostrophes, taken verbatim.
		    """
		    content_start = pos + 1  # step over the opening apostrophe
		    content_end = skip_until(
		        src, content_start, "'", error_on=ILLEGAL_LITERAL_STR_CHARS, error_on_eof=True
		    )
		    # "+ 1" steps over the closing apostrophe
		    return content_end + 1, src[content_start:content_end]


		def parse_multiline_str(src: str, pos: Pos, *, literal: bool) -> Tuple[Pos, str]:
		    """Parse a multiline string whose opening triple quote is at `pos`.

		    `literal` selects the apostrophe-delimited form, otherwise the
		    quotation-mark form with escapes is parsed. A newline right after the
		    opening delimiter is dropped. Returns the position after the string
		    and its content.
		    """
		    pos += 3
		    if src.startswith("\n", pos):
		        pos += 1

		    if literal:
		        delim = "'"
		        content_end = skip_until(
		            src,
		            pos,
		            "'''",
		            error_on=ILLEGAL_MULTILINE_LITERAL_STR_CHARS,
		            error_on_eof=True,
		        )
		        result = src[pos:content_end]
		        pos = content_end + 3
		    else:
		        delim = '"'
		        pos, result = parse_basic_str(src, pos, multiline=True)

		    # The closing sequence may be 4 or 5 delimiters long instead of 3;
		    # the extra one or two delimiters belong to the content.
		    extra = 0
		    while extra < 2 and src.startswith(delim, pos + extra):
		        extra += 1
		    return pos + extra, result + delim * extra


		def parse_basic_str(src: str, pos: Pos, *, multiline: bool) -> Tuple[Pos, str]:
		    """Parse the body of a basic string starting at `pos`.

		    `pos` must point just past the opening delimiter. Returns the position
		    after the closing delimiter (one quote, or three when `multiline`)
		    and the string content with escape sequences resolved.
		    """
		    if multiline:
		        error_on = ILLEGAL_MULTILINE_BASIC_STR_CHARS
		        parse_escapes = parse_basic_str_escape_multiline
		    else:
		        error_on = ILLEGAL_BASIC_STR_CHARS
		        parse_escapes = parse_basic_str_escape

		    # Finished pieces of the content; the piece currently being scanned is
		    # src[chunk_start:pos].
		    pieces = []
		    chunk_start = pos
		    while True:
		        try:
		            char = src[pos]
		        except IndexError:
		            raise suffixed_err(src, pos, "Unterminated string") from None
		        if char == '"':
		            if not multiline:
		                pieces.append(src[chunk_start:pos])
		                return pos + 1, "".join(pieces)
		            if src.startswith('"""', pos):
		                pieces.append(src[chunk_start:pos])
		                return pos + 3, "".join(pieces)
		            # A lone quote inside a multiline string is ordinary content.
		            pos += 1
		        elif char == "\\":
		            pieces.append(src[chunk_start:pos])
		            pos, parsed_escape = parse_escapes(src, pos)
		            pieces.append(parsed_escape)
		            chunk_start = pos
		        elif char in error_on:
		            raise suffixed_err(src, pos, f"Illegal character {char!r}")
		        else:
		            pos += 1


		def parse_value(  # noqa: C901
		    src: str, pos: Pos, parse_float: ParseFloat
		) -> Tuple[Pos, Any]:
		    """Parse the value that starts at `pos`.

		    Returns the position after the value and the parsed Python object.
		    The order of the checks below matters and must be kept.
		    """
		    # Empty at end of document, which matches none of the markers below.
		    lead = src[pos : pos + 1]

		    # Basic strings
		    if lead == '"':
		        if src.startswith('"""', pos):
		            return parse_multiline_str(src, pos, literal=False)
		        return parse_one_line_basic_str(src, pos)

		    # Literal strings
		    if lead == "'":
		        if src.startswith("'''", pos):
		            return parse_multiline_str(src, pos, literal=True)
		        return parse_literal_str(src, pos)

		    # Booleans
		    if src.startswith("true", pos):
		        return pos + 4, True
		    if src.startswith("false", pos):
		        return pos + 5, False

		    # Dates and times
		    datetime_match = RE_DATETIME.match(src, pos)
		    if datetime_match:
		        try:
		            datetime_obj = match_to_datetime(datetime_match)
		        except ValueError as e:
		            raise suffixed_err(src, pos, "Invalid date or datetime") from e
		        return datetime_match.end(), datetime_obj
		    localtime_match = RE_LOCALTIME.match(src, pos)
		    if localtime_match:
		        return localtime_match.end(), match_to_localtime(localtime_match)

		    # Integers and "normal" floats.
		    # The number regex greedily matches anything that starts with a
		    # decimal char, so it has to come after the date and time checks.
		    number_match = RE_NUMBER.match(src, pos)
		    if number_match:
		        return number_match.end(), match_to_number(number_match, parse_float)

		    # Arrays
		    if lead == "[":
		        return parse_array(src, pos, parse_float)

		    # Inline tables
		    if lead == "{":
		        return parse_inline_table(src, pos, parse_float)

		    # Special floats, first without and then with a sign
		    unsigned = src[pos : pos + 3]
		    if unsigned in ("inf", "nan"):
		        return pos + 3, parse_float(unsigned)
		    signed = src[pos : pos + 4]
		    if signed in ("-inf", "+inf", "-nan", "+nan"):
		        return pos + 4, parse_float(signed)

		    raise suffixed_err(src, pos, "Invalid value")


		def suffixed_err(src: str, pos: Pos, msg: str) -> TOMLDecodeError:
		    """Build a `TOMLDecodeError` whose message ends with where `pos` is.

		    The location is given as a 1-based line and column, or as
		    "end of document" when `pos` is at or past the end of `src`.
		    The error is returned, not raised.
		    """
		    if pos >= len(src):
		        location = "end of document"
		    else:
		        line = src.count("\n", 0, pos) + 1
		        # rfind() gives -1 when no newline precedes `pos`, which makes the
		        # column `pos + 1` on the first line.
		        column = pos - src.rfind("\n", 0, pos)
		        location = f"line {line}, column {column}"
		    return TOMLDecodeError(f"{msg} (at {location})")


		def is_unicode_scalar_value(codepoint: int) -> bool:
		    """Tell whether `codepoint` is a Unicode scalar value.

		    That is any code point from 0 to 0x10FFFF except the surrogate range
		    0xD800 to 0xDFFF.
		    """
		    if not 0 <= codepoint <= 0x10FFFF:
		        return False
		    return not 0xD800 <= codepoint <= 0xDFFF