upstream/mercurial-mirror Files · mercurial/lsprof.py

obsolete: order of magnitude speedup in _computebumpedset...

obsolete: order of magnitude speedup in _computebumpedset Reminder: a changeset is said to be "bumped" if it tries to obsolete an immutable changeset. The previous algorithm for computing bumped changesets was: 1) Get all public changesets 2) Find all their successors 3) Search for those that are eligible for being "bumped" (mutable and non-obsolete) The input size of this algorithm is `O(len(public))`, which is mostly the same as `O(len(repo))`. Even though this approach means fewer obsolescence markers are traversed, it is not very scalable. The new algorithm is: 1) For each potentially bumped changeset (non-obsolete mutable) 2) iterate over its precursors 3) if a precursor is public, the changeset is bumped. We traverse more obsolescence markers, but the input size is much smaller since the number of potentially bumped changesets should remain mostly stable over time, `O(1)`. On some confidential gigantic repo this moves bumped computation from 15.19s to 0.46s (×33 speedup…). On "smaller" repos (mercurial, cubicweb's review) no significant gain was seen. The additional traversal of obsolescence markers probably counterbalances the advantage. Other optimisations could be done in the future (e.g. sharing the precursors cache for divergence detection).

Mads Kiilerich - - Load All Authors

File last commit:

r18642:a40d608e default


                r20207:cd62532c

default

Download file

             lsprof.py
        
                    109 lines
            
             | 3.6 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / lsprof.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      import sys

      from _lsprof import Profiler, profiler_entry

      __all__ = ['profile', 'Stats']

      def profile(f, *args, **kwds):
          """Run ``f(*args, **kwds)`` under the lsprof profiler.

          The profiler is enabled with sub-call and builtin tracking and is
          disabled again even when ``f`` raises; in that case the exception
          propagates and nothing is returned.  The return value of ``f`` is
          discarded.

          Returns a ``Stats`` object built from ``Profiler.getstats()``.
          """
          profiler = Profiler()
          profiler.enable(subcalls=True, builtins=True)
          try:
              f(*args, **kwds)
          finally:
              profiler.disable()
          collected = profiler.getstats()
          return Stats(collected)

      class Stats(object):
          """Sortable, printable wrapper around a list of profiler entries."""

          def __init__(self, data):
              # data: list of profiler entries, e.g. what Profiler.getstats()
              # returns; it is kept by reference and modified in place by
              # sort() and freeze()
              self.data = data

          def sort(self, crit="inlinetime"):
              """Sort the entries and each entry's sub-calls by ``crit``.

              Sorting is in place and descending.  ``crit`` must be a key of
              ``profiler_entry.__dict__``; otherwise ValueError is raised.
              """
              if crit not in profiler_entry.__dict__:
                  raise ValueError("Can't sort by %s" % crit)

              def sortkey(entry):
                  return getattr(entry, crit)

              self.data.sort(key=sortkey, reverse=True)
              for entry in self.data:
                  subcalls = entry.calls
                  if subcalls:
                      subcalls.sort(key=sortkey, reverse=True)

          def pprint(self, top=None, file=None, limit=None, climit=None):
              """Write a table of the entries to ``file``.

              file   -- object with a write() method; sys.stdout when None
              top    -- when not None, only the first ``top`` entries are used
              limit  -- when not None, return once this many rows (entries plus
                        sub-call rows; the header is not counted) were written
              climit -- when truthy, each entry is followed by at most
                        ``climit`` of its sub-call rows
              """
              out = file
              if out is None:
                  out = sys.stdout
              entries = self.data
              if top is not None:
                  entries = entries[:top]
              rowfmt = "% 12s %12s %11.4f %11.4f   %s\n"
              headfmt = "% 12s %12s %12s %12s %s\n"
              out.write(headfmt % ("CallCount", "Recursive", "Total(s)",
                                   "Inline(s)", "module:lineno(function)"))
              written = 0
              for entry in entries:
                  out.write(rowfmt % (entry.callcount, entry.reccallcount,
                                      entry.totaltime, entry.inlinetime,
                                      label(entry.code)))
                  written += 1
                  if limit is not None and written == limit:
                      return
                  if not (climit and entry.calls):
                      continue
                  shown = 0
                  for sub in entry.calls:
                      # sub-call rows are indented inside the last column
                      out.write(rowfmt % (sub.callcount, sub.reccallcount,
                                          sub.totaltime, sub.inlinetime,
                                          "    %s" % label(sub.code)))
                      written += 1
                      shown += 1
                      if limit is not None and written == limit:
                          return
                      # climit is truthy here, so a plain comparison suffices
                      if shown == climit:
                          break

          def freeze(self):
              """Replace all code objects with their string labels, in place.

              Both the entries and their sub-calls are rewritten; this makes it
              possible to pickle the instance.
              """
              for idx, entry in enumerate(self.data):
                  if not isinstance(entry.code, str):
                      rebuilt = (label(entry.code),) + entry[1:]
                      self.data[idx] = type(entry)(rebuilt)
                  # NOTE: the sub-call list is taken from the entry as it was
                  # before replacement; entry[1:] hands that same list object
                  # to the rebuilt entry's constructor.
                  subcalls = entry.calls
                  if not subcalls:
                      continue
                  for pos, sub in enumerate(subcalls):
                      if not isinstance(sub.code, str):
                          subcalls[pos] = type(sub)((label(sub.code),) + sub[1:])

      # cache used by label(): code.co_filename -> module name, or
      # '<filename>' when no loaded module matches
      _fn2mod = {}

      def label(code):
          """Return a ``module:lineno(function)`` label for ``code``.

          ``code`` is either a code object or a string.  Strings (for example
          the codes of an already frozen Stats) are returned unchanged.  For
          code objects the module name is looked up by file name among the
          loaded modules and cached in ``_fn2mod``; when no module matches,
          ``<filename>`` is used in its place.
          """
          if isinstance(code, str):
              return code
          filename = code.co_filename
          try:
              mname = _fn2mod[filename]
          except KeyError:
              # items() instead of the Python-2-only iteritems(), so the scan
              # runs on both Python 2 and Python 3; list() iterates a snapshot
              # of sys.modules rather than the live dict.
              for k, v in list(sys.modules.items()):
                  if v is None:
                      continue
                  if not isinstance(getattr(v, '__file__', None), str):
                      continue
                  # prefix match: a module loaded from "x.pyc" matches "x.py"
                  if v.__file__.startswith(filename):
                      mname = _fn2mod[filename] = k
                      break
              else:
                  mname = _fn2mod[filename] = '<%s>' % filename
          return '%s:%d(%s)' % (mname, code.co_firstlineno, code.co_name)

      if __name__ == '__main__':
          # Command-line use: lsprof.py <script> <arguments...>
          # Runs <script> under the profiler, then prints the statistics
          # sorted by the default criterion of Stats.sort().
          import os

          # drop our own name so that argv[0] is the script being profiled
          sys.argv = sys.argv[1:]
          if not sys.argv:
              # sys.stderr.write() instead of the Python-2-only "print >>" form
              sys.stderr.write("usage: lsprof.py <script> <arguments...>\n")
              sys.exit(2)
          # let the script import modules that live next to it
          sys.path.insert(0, os.path.abspath(os.path.dirname(sys.argv[0])))

          try:
              runscript = execfile
          except NameError:
              # no execfile() builtin (Python 3): minimal stand-in
              def runscript(path, globs, locs):
                  fh = open(path, 'rb')
                  try:
                      source = fh.read()
                  finally:
                      fh.close()
                  exec(compile(source, path, 'exec'), globs, locs)

          stats = profile(runscript, sys.argv[0], globals(), locals())
          stats.sort()
          stats.pprint()

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				import sys
				from _lsprof import Profiler, profiler_entry

				__all__ = ['profile', 'Stats']

				def profile(f, *args, **kwds):
				    """Run ``f(*args, **kwds)`` under the lsprof profiler.

				    The profiler is enabled with sub-call and builtin tracking and is
				    disabled again even when ``f`` raises; in that case the exception
				    propagates and nothing is returned.  The return value of ``f`` is
				    discarded.

				    Returns a ``Stats`` object built from ``Profiler.getstats()``.
				    """
				    p = Profiler()
				    p.enable(subcalls=True, builtins=True)
				    try:
				        f(*args, **kwds)
				    finally:
				        p.disable()
				    return Stats(p.getstats())


				class Stats(object):
				    """Sortable, printable wrapper around a list of profiler entries."""

				    def __init__(self, data):
				        # data: list of profiler entries, e.g. what Profiler.getstats()
				        # returns; it is kept by reference and modified in place by
				        # sort() and freeze()
				        self.data = data

				    def sort(self, crit="inlinetime"):
				        """Sort the entries and each entry's sub-calls by ``crit``.

				        Sorting is in place and descending.  ``crit`` must be a key of
				        ``profiler_entry.__dict__``; otherwise ValueError is raised.
				        """
				        if crit not in profiler_entry.__dict__:
				            raise ValueError("Can't sort by %s" % crit)
				        self.data.sort(key=lambda x: getattr(x, crit), reverse=True)
				        for e in self.data:
				            if e.calls:
				                e.calls.sort(key=lambda x: getattr(x, crit), reverse=True)

				    def pprint(self, top=None, file=None, limit=None, climit=None):
				        """Write a table of the entries to ``file``.

				        file   -- object with a write() method; sys.stdout when None
				        top    -- when not None, only the first ``top`` entries are used
				        limit  -- when not None, return once this many rows (entries plus
				                  sub-call rows; the header is not counted) were written
				        climit -- when truthy, each entry is followed by at most
				                  ``climit`` of its sub-call rows
				        """
				        if file is None:
				            file = sys.stdout
				        d = self.data
				        if top is not None:
				            d = d[:top]
				        # three spaces before the label column, four before a sub-call
				        # label, so that sub-calls read as indented under their caller
				        cols = "% 12s %12s %11.4f %11.4f   %s\n"
				        hcols = "% 12s %12s %12s %12s %s\n"
				        file.write(hcols % ("CallCount", "Recursive", "Total(s)",
				                            "Inline(s)", "module:lineno(function)"))
				        count = 0
				        for e in d:
				            file.write(cols % (e.callcount, e.reccallcount, e.totaltime,
				                               e.inlinetime, label(e.code)))
				            count += 1
				            if limit is not None and count == limit:
				                return
				            ccount = 0
				            if climit and e.calls:
				                for se in e.calls:
				                    file.write(cols % (se.callcount, se.reccallcount,
				                                       se.totaltime, se.inlinetime,
				                                       "    %s" % label(se.code)))
				                    count += 1
				                    ccount += 1
				                    if limit is not None and count == limit:
				                        return
				                    if climit is not None and ccount == climit:
				                        break

				    def freeze(self):
				        """Replace all references to code objects with string
				        descriptions; this makes it possible to pickle the instance."""
				        for i, e in enumerate(self.data):
				            if not isinstance(e.code, str):
				                self.data[i] = type(e)((label(e.code),) + e[1:])
				            # NOTE: e is still the entry as it was before replacement;
				            # e[1:] hands its calls list to the rebuilt entry's constructor.
				            if e.calls:
				                for j, se in enumerate(e.calls):
				                    if not isinstance(se.code, str):
				                        e.calls[j] = type(se)((label(se.code),) + se[1:])

				# cache used by label(): code.co_filename -> module name, or
				# '<filename>' when no loaded module matches
				_fn2mod = {}

				def label(code):
				    """Return a ``module:lineno(function)`` label for ``code``.

				    ``code`` is either a code object or a string.  Strings (for example
				    the codes of an already frozen Stats) are returned unchanged.  For
				    code objects the module name is looked up by file name among the
				    loaded modules and cached in ``_fn2mod``; when no module matches,
				    ``<filename>`` is used in its place.
				    """
				    if isinstance(code, str):
				        return code
				    try:
				        mname = _fn2mod[code.co_filename]
				    except KeyError:
				        # items() instead of the Python-2-only iteritems(), so the scan
				        # runs on both Python 2 and Python 3; list() iterates a snapshot
				        # of sys.modules rather than the live dict.
				        for k, v in list(sys.modules.items()):
				            if v is None:
				                continue
				            if not isinstance(getattr(v, '__file__', None), str):
				                continue
				            # prefix match: a module loaded from "x.pyc" matches "x.py"
				            if v.__file__.startswith(code.co_filename):
				                mname = _fn2mod[code.co_filename] = k
				                break
				        else:
				            mname = _fn2mod[code.co_filename] = '<%s>' % code.co_filename

				    return '%s:%d(%s)' % (mname, code.co_firstlineno, code.co_name)


				if __name__ == '__main__':
				    # Command-line use: lsprof.py <script> <arguments...>
				    # Runs <script> under the profiler, then prints the statistics
				    # sorted by the default criterion of Stats.sort().
				    import os

				    # drop our own name so that argv[0] is the script being profiled
				    sys.argv = sys.argv[1:]
				    if not sys.argv:
				        # sys.stderr.write() instead of the Python-2-only "print >>" form
				        sys.stderr.write("usage: lsprof.py <script> <arguments...>\n")
				        sys.exit(2)
				    # let the script import modules that live next to it
				    sys.path.insert(0, os.path.abspath(os.path.dirname(sys.argv[0])))

				    try:
				        runscript = execfile
				    except NameError:
				        # no execfile() builtin (Python 3): minimal stand-in
				        def runscript(path, globs, locs):
				            fh = open(path, 'rb')
				            try:
				                source = fh.read()
				            finally:
				                fh.close()
				            exec(compile(source, path, 'exec'), globs, locs)

				    stats = profile(runscript, sys.argv[0], globals(), locals())
				    stats.sort()
				    stats.pprint()