upstream/kallithea Commit - r1338:bbfc3f30

Updated test_crawler to scan paths in more sensible order using ordered tuple.

marcink -

r1338:bbfc3f30 beta

parent child

rhodecode/tests/test_crawler.py

0 +20 -11

              # -*- coding: utf-8 -*-
              """
                  rhodecode.tests.test_crawer
                  ~~~~~~~~~~~~~~~~~~~~~~~~~~~
                  Test for crawling a project for memory usage
                  watch -n1 ./rhodecode/tests/mem_watch
                  :created_on: Apr 21, 2010
                  :author: marcink
                  :copyright: (C) 2009-2011 Marcin Kuzminski <marcin@python-works.com>
                  :license: GPLv3, see COPYING for more details.
              """
              # This program is free software: you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation, either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program.  If not, see <http://www.gnu.org/licenses/>.
              import cookielib
              import urllib
              import urllib2
              import vcs
              import time
              from os.path import join as jn
              BASE_URI = 'http://127.0.0.1:5000/%s'
              PROJECT = 'CPython'
              PROJECT_PATH = jn('/', 'home', 'marcink', 'hg_repos')
              cj = cookielib.FileCookieJar('/tmp/rc_test_cookie.txt')
              o = urllib2.build_opener(urllib2.HTTPCookieProcessor(cj))
              o.addheaders = [
                                   ('User-agent', 'rhodecode-crawler'),
                                   ('Accept-Language', 'en - us, en;q = 0.5')
                                  ]
              urllib2.install_opener(o)
              def test_changelog_walk(pages=100):
                  total_time = 0
                  for i in range(1, pages):
                      page = '/'.join((PROJECT, 'changelog',))
                      full_uri = (BASE_URI % page) + '?' + urllib.urlencode({'page':i})
                      s = time.time()
                      f = o.open(full_uri)
                      size = len(f.read())
                      e = time.time() - s
                      total_time += e
                      print 'visited %s size:%s req:%s ms' % (full_uri, size, e)
                  print 'total_time', total_time
                  print 'average on req', total_time / float(pages)
-             def test_changeset_walk():
-                 print jn(PROJECT_PATH, PROJECT)
+             def test_changeset_walk(limit=None):
+                 print 'processing', jn(PROJECT_PATH, PROJECT)
                  total_time = 0
                  repo = vcs.get_repo(jn(PROJECT_PATH, PROJECT))
+                 cnt = 0
                  for i in repo:
+                     cnt += 1
                      raw_cs = '/'.join((PROJECT, 'changeset', i.raw_id))
+                     if limit and limit == cnt:
+                         break
                      full_uri = (BASE_URI % raw_cs)
                      s = time.time()
                      f = o.open(full_uri)
                      size = len(f.read())
                      e = time.time() - s
                      total_time += e
                      print 'visited %s\%s size:%s req:%s ms' % (full_uri, i, size, e)
                  print 'total_time', total_time
-                 print 'average on req', total_time / float(len(repo))
+                 print 'average on req', total_time / float(cnt)
              def test_files_walk():
-                 print jn(PROJECT_PATH, PROJECT)
+                 print 'processing', jn(PROJECT_PATH, PROJECT)
                  total_time = 0
                  repo = vcs.get_repo(jn(PROJECT_PATH, PROJECT))
-                 paths_ = set()
+                 from rhodecode.lib.oset import OrderedSet
+                 paths_ = OrderedSet([''])
                  try:
                      tip = repo.get_changeset('tip')
                      for topnode, dirs, files in tip.walk('/'):
-                         for f in files:
+                         for dir in dirs:
+                             paths_.add(dir.path)
+                             for f in dir:
                              paths_.add(f.path)
-                         for dir in dirs:
-                             for f in files:
-                                 paths_.add(f.path)
                  except vcs.exception.RepositoryError, e:
                      pass
                  for f in paths_:
                      file_path = '/'.join((PROJECT, 'files', 'tip', f))
                      full_uri = (BASE_URI % file_path)
                      s = time.time()
                      f = o.open(full_uri)
                      size = len(f.read())
                      e = time.time() - s
                      total_time += e
                      print 'visited %s size:%s req:%s ms' % (full_uri, size, e)
                  print 'total_time', total_time
                  print 'average on req', total_time / float(len(repo))
-             #test_changelog_walk()
-             #test_changeset_walk()
              test_files_walk()
+             test_changelog_walk(40)
+             test_changeset_walk(limit=100)

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages