upstream/mercurial-mirror Files · contrib/automation/hgautomation/try_server.py

memory-usage: fix `hg log --follow --rev R F` space complexity...

memory-usage: fix `hg log --follow --rev R F` space complexity When running `hg log --follow --rev REVS FILES`, the log code walks the history of all FILES, starting from the file revisions that exist in each of REVS. Before doing so, it checks whether the files actually exist in the target revisions. To do so, it opens the manifest of each revision in REVS and checks whether it contains the associated items in FILES. Before this changeset, this was done in a way that created a changectx for each target revision and kept them all in memory while looking into each file. If the set of REVS is large, this means keeping the manifest for each entry in REVS in memory. That can be large… if REVS is of the form `::X`, this can quickly become huge and saturate the memory. We have seen usage allocating 2GB per second until memory runs out. So this changeset inverts the two loops so that only one revision is kept in memory during the operation. This solves the memory explosion issue.

Gregory Szorc - - Load All Authors

File last commit:

r43327:c5c502bd default


                r50517:dcb2581e

stable

Download file

             try_server.py
        
                    99 lines
            
             | 2.4 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / contrib / automation / hgautomation / try_server.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      # try_server.py - Interact with Try server

      #

      # Copyright 2019 Gregory Szorc <gregory.szorc@gmail.com>

      #

      # This software may be used and distributed according to the terms of the

      # GNU General Public License version 2 or any later version.

      # no-check-code because Python 3 native.

      import base64

      import json

      import os

      import subprocess

      import tempfile

      from .aws import AWSConnection

      LAMBDA_FUNCTION = "ci-try-server-upload"

      def trigger_try(c: AWSConnection, rev="."):
          """Trigger a new Try run.

          Bundles ``rev`` with ``generate_bundle()``, prints the resolved
          changeset metadata, and synchronously invokes the
          ``LAMBDA_FUNCTION`` Lambda function with the base64-encoded bundle
          and metadata as a JSON payload. Each message in the function's
          response is printed with a ``remote: `` prefix.

          ``c`` must expose a ``session`` whose ``client("lambda")`` returns a
          Lambda client.

          Raises ``RuntimeError`` if the Lambda invocation reports a function
          error, instead of printing the error document as if it were a list
          of remote messages.
          """
          lambda_client = c.session.client("lambda")

          cset, bundle = generate_bundle(rev=rev)

          payload = {
              "bundle": base64.b64encode(bundle).decode("utf-8"),
              "node": cset["node"],
              "branch": cset["branch"],
              "user": cset["user"],
              "message": cset["desc"],
          }

          # An empty description makes ``splitlines()`` return ``[]``; fall
          # back to an empty summary rather than raising IndexError.
          desc_lines = cset["desc"].splitlines()
          summary = desc_lines[0] if desc_lines else ""

          print("resolved revision:")
          print("node: %s" % cset["node"])
          print("branch: %s" % cset["branch"])
          print("user: %s" % cset["user"])
          print("desc: %s" % summary)
          print()

          print("sending to Try...")
          res = lambda_client.invoke(
              FunctionName=LAMBDA_FUNCTION,
              InvocationType="RequestResponse",
              Payload=json.dumps(payload).encode("utf-8"),
          )

          body = json.load(res["Payload"])

          # For a RequestResponse invocation, a failure inside the function is
          # signalled by a "FunctionError" entry in the response; the payload
          # is then an error document, not the expected list of messages.
          if res.get("FunctionError"):
              raise RuntimeError(
                  "Try server upload failed (%s): %s"
                  % (res["FunctionError"], json.dumps(body))
              )

          for message in body:
              print("remote: %s" % message)

      def generate_bundle(rev="."):
          """Build the bundle and changeset metadata needed for a Try push.

          Returns a ``(metadata, bundle)`` tuple: the first JSON record emitted
          by ``hg log -r rev -T json`` and the raw bytes of the bundle file
          written by ``hg bundle``.
          """
          # `hg bundle` cannot stream to stdout, so it writes to a scratch file
          # that is read back and then removed.
          handle, bundle_path = tempfile.mkstemp(
              prefix="hg-bundle-", suffix=".hg"
          )
          try:
              # Only the path is needed; hg opens the file itself.
              os.close(handle)

              print("generating bundle...")
              subprocess.run(
                  [
                      "hg",
                      "bundle",
                      "--type",
                      "gzip-v2",
                      "--base",
                      "public()",
                      "--rev",
                      rev,
                      bundle_path,
                  ],
                  check=True,
              )

              with open(bundle_path, "rb") as bundle_file:
                  bundle_data = bundle_file.read()
          finally:
              os.unlink(bundle_path)

          # The metadata is uploaded as JSON, so it has to be normalized to
          # UTF-8 anyway; asking hg for JSON output directly is therefore fine.
          log_command = ["hg", "log", "-r", rev, "-T", "json"]
          completed = subprocess.run(
              log_command, check=True, capture_output=True
          )
          records = json.loads(completed.stdout)
          return records[0], bundle_data

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				# try_server.py - Interact with Try server
				#
				# Copyright 2019 Gregory Szorc <gregory.szorc@gmail.com>
				#
				# This software may be used and distributed according to the terms of the
				# GNU General Public License version 2 or any later version.

				# no-check-code because Python 3 native.

				import base64
				import json
				import os
				import subprocess
				import tempfile

				from .aws import AWSConnection

				LAMBDA_FUNCTION = "ci-try-server-upload"


				def trigger_try(c: AWSConnection, rev="."):
				    """Trigger a new Try run.

				    Bundles ``rev`` with ``generate_bundle()``, prints the resolved
				    changeset metadata, and synchronously invokes the
				    ``LAMBDA_FUNCTION`` Lambda function with the base64-encoded bundle
				    and metadata as a JSON payload. Each message in the function's
				    response is printed with a ``remote: `` prefix.

				    ``c`` must expose a ``session`` whose ``client("lambda")`` returns a
				    Lambda client.

				    Raises ``RuntimeError`` if the Lambda invocation reports a function
				    error, instead of printing the error document as if it were a list
				    of remote messages.
				    """
				    lambda_client = c.session.client("lambda")

				    cset, bundle = generate_bundle(rev=rev)

				    payload = {
				        "bundle": base64.b64encode(bundle).decode("utf-8"),
				        "node": cset["node"],
				        "branch": cset["branch"],
				        "user": cset["user"],
				        "message": cset["desc"],
				    }

				    # An empty description makes ``splitlines()`` return ``[]``; fall
				    # back to an empty summary rather than raising IndexError.
				    desc_lines = cset["desc"].splitlines()
				    summary = desc_lines[0] if desc_lines else ""

				    print("resolved revision:")
				    print("node: %s" % cset["node"])
				    print("branch: %s" % cset["branch"])
				    print("user: %s" % cset["user"])
				    print("desc: %s" % summary)
				    print()

				    print("sending to Try...")
				    res = lambda_client.invoke(
				        FunctionName=LAMBDA_FUNCTION,
				        InvocationType="RequestResponse",
				        Payload=json.dumps(payload).encode("utf-8"),
				    )

				    body = json.load(res["Payload"])

				    # For a RequestResponse invocation, a failure inside the function is
				    # signalled by a "FunctionError" entry in the response; the payload
				    # is then an error document, not the expected list of messages.
				    if res.get("FunctionError"):
				        raise RuntimeError(
				            "Try server upload failed (%s): %s"
				            % (res["FunctionError"], json.dumps(body))
				        )

				    for message in body:
				        print("remote: %s" % message)


				def generate_bundle(rev="."):
				    """Build the bundle and changeset metadata needed for a Try push.

				    Returns a ``(metadata, bundle)`` tuple: the first JSON record emitted
				    by ``hg log -r rev -T json`` and the raw bytes of the bundle file
				    written by ``hg bundle``.
				    """
				    # `hg bundle` cannot stream to stdout, so it writes to a scratch file
				    # that is read back and then removed.
				    handle, bundle_path = tempfile.mkstemp(
				        prefix="hg-bundle-", suffix=".hg"
				    )
				    try:
				        # Only the path is needed; hg opens the file itself.
				        os.close(handle)

				        print("generating bundle...")
				        subprocess.run(
				            [
				                "hg",
				                "bundle",
				                "--type",
				                "gzip-v2",
				                "--base",
				                "public()",
				                "--rev",
				                rev,
				                bundle_path,
				            ],
				            check=True,
				        )

				        with open(bundle_path, "rb") as bundle_file:
				            bundle_data = bundle_file.read()
				    finally:
				        os.unlink(bundle_path)

				    # The metadata is uploaded as JSON, so it has to be normalized to
				    # UTF-8 anyway; asking hg for JSON output directly is therefore fine.
				    log_command = ["hg", "log", "-r", rev, "-T", "json"]
				    completed = subprocess.run(
				        log_command, check=True, capture_output=True
				    )
				    records = json.loads(completed.stdout)
				    return records[0], bundle_data