##// END OF EJS Templates
git: use non-unicode author extraction as it's returned as bytes from backend, and we can...
marcink -
r825:dc8df3e0 stable
parent child Browse files
Show More
@@ -1,1177 +1,1181 b''
1 # RhodeCode VCSServer provides access to different vcs backends via network.
1 # RhodeCode VCSServer provides access to different vcs backends via network.
2 # Copyright (C) 2014-2019 RhodeCode GmbH
2 # Copyright (C) 2014-2019 RhodeCode GmbH
3 #
3 #
4 # This program is free software; you can redistribute it and/or modify
4 # This program is free software; you can redistribute it and/or modify
5 # it under the terms of the GNU General Public License as published by
5 # it under the terms of the GNU General Public License as published by
6 # the Free Software Foundation; either version 3 of the License, or
6 # the Free Software Foundation; either version 3 of the License, or
7 # (at your option) any later version.
7 # (at your option) any later version.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU General Public License
14 # You should have received a copy of the GNU General Public License
15 # along with this program; if not, write to the Free Software Foundation,
15 # along with this program; if not, write to the Free Software Foundation,
16 # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
16 # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17
17
18 import collections
18 import collections
19 import logging
19 import logging
20 import os
20 import os
21 import posixpath as vcspath
21 import posixpath as vcspath
22 import re
22 import re
23 import stat
23 import stat
24 import traceback
24 import traceback
25 import urllib
25 import urllib
26 import urllib2
26 import urllib2
27 from functools import wraps
27 from functools import wraps
28
28
29 import more_itertools
29 import more_itertools
30 import pygit2
30 import pygit2
31 from pygit2 import Repository as LibGit2Repo
31 from pygit2 import Repository as LibGit2Repo
32 from dulwich import index, objects
32 from dulwich import index, objects
33 from dulwich.client import HttpGitClient, LocalGitClient
33 from dulwich.client import HttpGitClient, LocalGitClient
34 from dulwich.errors import (
34 from dulwich.errors import (
35 NotGitRepository, ChecksumMismatch, WrongObjectException,
35 NotGitRepository, ChecksumMismatch, WrongObjectException,
36 MissingCommitError, ObjectMissing, HangupException,
36 MissingCommitError, ObjectMissing, HangupException,
37 UnexpectedCommandError)
37 UnexpectedCommandError)
38 from dulwich.repo import Repo as DulwichRepo
38 from dulwich.repo import Repo as DulwichRepo
39 from dulwich.server import update_server_info
39 from dulwich.server import update_server_info
40
40
41 from vcsserver import exceptions, settings, subprocessio
41 from vcsserver import exceptions, settings, subprocessio
42 from vcsserver.utils import safe_str, safe_int
42 from vcsserver.utils import safe_str, safe_int, safe_unicode
43 from vcsserver.base import RepoFactory, obfuscate_qs
43 from vcsserver.base import RepoFactory, obfuscate_qs
44 from vcsserver.hgcompat import (
44 from vcsserver.hgcompat import (
45 hg_url as url_parser, httpbasicauthhandler, httpdigestauthhandler)
45 hg_url as url_parser, httpbasicauthhandler, httpdigestauthhandler)
46 from vcsserver.git_lfs.lib import LFSOidStore
46 from vcsserver.git_lfs.lib import LFSOidStore
47 from vcsserver.vcs_base import RemoteBase
47 from vcsserver.vcs_base import RemoteBase
48
48
49 DIR_STAT = stat.S_IFDIR
49 DIR_STAT = stat.S_IFDIR
50 FILE_MODE = stat.S_IFMT
50 FILE_MODE = stat.S_IFMT
51 GIT_LINK = objects.S_IFGITLINK
51 GIT_LINK = objects.S_IFGITLINK
52 PEELED_REF_MARKER = '^{}'
52 PEELED_REF_MARKER = '^{}'
53
53
54
54
55 log = logging.getLogger(__name__)
55 log = logging.getLogger(__name__)
56
56
57
57
def str_to_dulwich(value):
    """
    Decode `value` using the encoding configured in ``settings.WIRE_ENCODING``.

    Dulwich 0.10.1a requires `unicode` objects to be passed in.
    """
    decoded = value.decode(settings.WIRE_ENCODING)
    return decoded
63
63
64
64
def reraise_safe_exceptions(func):
    """
    Decorator converting Dulwich exceptions to something neutral.

    Object lookup failures are re-raised via ``exceptions.LookupException``
    and protocol failures via ``exceptions.VcsException``, both carrying the
    original exception as ``org_exc``. Every other exception propagates
    unchanged.
    """

    @wraps(func)
    def wrapper(*args, **kwargs):
        try:
            return func(*args, **kwargs)
        except (ChecksumMismatch, WrongObjectException,
                MissingCommitError, ObjectMissing) as lookup_error:
            raise exceptions.LookupException(org_exc=lookup_error)(
                safe_str(lookup_error))
        except (HangupException, UnexpectedCommandError) as protocol_error:
            raise exceptions.VcsException(org_exc=protocol_error)(
                safe_str(protocol_error))
        # NOTE(marcink): because of how dulwich handles some exceptions
        # (KeyError on empty repos), we cannot track this and catch all
        # exceptions; anything else, including exceptions from other
        # handlers, is left to propagate as-is.

    return wrapper
87
87
88
88
class Repo(DulwichRepo):
    """
    A wrapper for dulwich Repo class.

    Since dulwich is sometimes keeping .idx file descriptors open, it leads to
    "Too many open files" error. We need to close all opened file descriptors
    once the repo object is destroyed.
    """

    def __del__(self):
        # `object_store` is missing when initialisation did not get far
        # enough to set it; in that case there is nothing to close.
        if not hasattr(self, 'object_store'):
            return
        self.close()
100
100
101
101
class Repository(LibGit2Repo):
    """
    pygit2 repository usable as a context manager.

    Entering the context yields the repository itself; leaving it calls
    ``free()``. ``__exit__`` returns nothing, so exceptions raised inside
    the ``with`` body are not suppressed.
    """

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        # always release the repository, whether or not an error occurred
        self.free()
109
109
110
110
class GitFactory(RepoFactory):
    """
    Factory producing repository objects for the path stored in a `wire`.
    """
    repo_type = 'git'

    def _create_repo(self, wire, create, use_libgit2=False):
        """
        Build a repository object for ``wire['path']``.

        Returns the pygit2 based `Repository` when `use_libgit2` is true,
        otherwise the dulwich based `Repo`. `create` is accepted but not
        used here.
        """
        if not use_libgit2:
            # dulwich wants the path decoded, see `str_to_dulwich`
            return Repo(str_to_dulwich(wire['path']))
        return Repository(wire['path'])

    def repo(self, wire, create=False, use_libgit2=False):
        """
        Get a repository instance for the given path.
        """
        return self._create_repo(wire, create, use_libgit2)

    def repo_libgit2(self, wire):
        """
        Shortcut for ``repo(wire, use_libgit2=True)``.
        """
        return self.repo(wire, use_libgit2=True)
129
129
130
130
131 class GitRemote(RemoteBase):
131 class GitRemote(RemoteBase):
132
132
def __init__(self, factory):
    """
    Store the repository `factory` and register the bound methods that
    `bulk_request` dispatches to, keyed by attribute name.
    """
    self._factory = factory
    self._bulk_methods = dict([
        ("date", self.date),
        ("author", self.author),
        ("branch", self.branch),
        ("message", self.message),
        ("parents", self.parents),
        ("_commit", self.revision),
    ])
143
143
144 def _wire_to_config(self, wire):
144 def _wire_to_config(self, wire):
145 if 'config' in wire:
145 if 'config' in wire:
146 return dict([(x[0] + '_' + x[1], x[2]) for x in wire['config']])
146 return dict([(x[0] + '_' + x[1], x[2]) for x in wire['config']])
147 return {}
147 return {}
148
148
149 def _remote_conf(self, config):
149 def _remote_conf(self, config):
150 params = [
150 params = [
151 '-c', 'core.askpass=""',
151 '-c', 'core.askpass=""',
152 ]
152 ]
153 ssl_cert_dir = config.get('vcs_ssl_dir')
153 ssl_cert_dir = config.get('vcs_ssl_dir')
154 if ssl_cert_dir:
154 if ssl_cert_dir:
155 params.extend(['-c', 'http.sslCAinfo={}'.format(ssl_cert_dir)])
155 params.extend(['-c', 'http.sslCAinfo={}'.format(ssl_cert_dir)])
156 return params
156 return params
157
157
@reraise_safe_exceptions
def discover_git_version(self):
    """
    Run ``git --version`` and return its output with the leading
    ``git version`` prefix (when present) and surrounding whitespace removed.
    """
    output, _ = self.run_git_command(
        {}, ['--version'], _bare=True, _safe=True)

    marker = 'git version'
    version = output[len(marker):] if output.startswith(marker) else output
    return version.strip()
166
166
@reraise_safe_exceptions
def is_empty(self, wire):
    """
    Tell whether the repository behind `wire` is empty.

    Returns False as soon as ``repo.head.name`` is truthy, otherwise falls
    back to ``repo.is_empty``. Any exception raised during those checks is
    treated as "empty" and yields True.
    """
    with self._factory.repo_libgit2(wire) as repo:
        try:
            if repo.head.name:
                return False

            # NOTE(marcink): check again using more expensive method
            return repo.is_empty
        except Exception:
            # best-effort: a failing HEAD lookup is reported as empty
            return True
183
183
@reraise_safe_exceptions
def assert_correct_path(self, wire):
    """
    Check that the path in `wire` can be opened as a Git repository.

    Returns True when the libgit2 repository opens, False when opening
    raises ``pygit2.GitError`` (the path and traceback are logged at debug
    level). The check goes through the region's conditional cache, which is
    enabled according to ``self._cache_on(wire)``.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _assert_correct_path(_context_uid, _repo_id):
        try:
            # opening (and immediately releasing) the repo is the whole test
            with self._factory.repo_libgit2(wire):
                pass
        except pygit2.GitError:
            log.debug(
                "Invalid Git path `%s`, tb: %s",
                wire.get('path'), traceback.format_exc())
            return False

        return True

    return _assert_correct_path(context_uid, repo_id)
201
201
@reraise_safe_exceptions
def bare(self, wire):
    """
    Return the ``is_bare`` flag of the libgit2 repository behind `wire`.
    """
    with self._factory.repo_libgit2(wire) as repo:
        is_bare = repo.is_bare
    return is_bare
207
207
@reraise_safe_exceptions
def blob_as_pretty_string(self, wire, sha):
    """
    Look up the object `sha` in the repository and return its ``data``.
    """
    with self._factory.repo_libgit2(wire) as repo:
        return repo[sha].data
215
215
@reraise_safe_exceptions
def blob_raw_length(self, wire, sha):
    """
    Return the ``size`` of the object `sha` in the repository.

    The lookup goes through the region's conditional cache, called with the
    repo id and `sha`.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _blob_raw_length(_repo_id, _sha):
        with self._factory.repo_libgit2(wire) as repo:
            return repo[sha].size

    return _blob_raw_length(repo_id, sha)
228
228
229 def _parse_lfs_pointer(self, raw_content):
229 def _parse_lfs_pointer(self, raw_content):
230
230
231 spec_string = 'version https://git-lfs.github.com/spec'
231 spec_string = 'version https://git-lfs.github.com/spec'
232 if raw_content and raw_content.startswith(spec_string):
232 if raw_content and raw_content.startswith(spec_string):
233 pattern = re.compile(r"""
233 pattern = re.compile(r"""
234 (?:\n)?
234 (?:\n)?
235 ^version[ ]https://git-lfs\.github\.com/spec/(?P<spec_ver>v\d+)\n
235 ^version[ ]https://git-lfs\.github\.com/spec/(?P<spec_ver>v\d+)\n
236 ^oid[ ] sha256:(?P<oid_hash>[0-9a-f]{64})\n
236 ^oid[ ] sha256:(?P<oid_hash>[0-9a-f]{64})\n
237 ^size[ ](?P<oid_size>[0-9]+)\n
237 ^size[ ](?P<oid_size>[0-9]+)\n
238 (?:\n)?
238 (?:\n)?
239 """, re.VERBOSE | re.MULTILINE)
239 """, re.VERBOSE | re.MULTILINE)
240 match = pattern.match(raw_content)
240 match = pattern.match(raw_content)
241 if match:
241 if match:
242 return match.groupdict()
242 return match.groupdict()
243
243
244 return {}
244 return {}
245
245
@reraise_safe_exceptions
def is_large_file(self, wire, commit_id):
    """
    Return the parsed LFS pointer data for the object `commit_id`.

    The object is looked up in the repository; a binary object yields an
    empty dict, otherwise its data is handed to `_parse_lfs_pointer`. The
    lookup goes through the region's conditional cache.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _is_large_file(_repo_id, _sha):
        with self._factory.repo_libgit2(wire) as repo:
            blob = repo[commit_id]
            # binary content cannot be an LFS pointer file
            if not blob.is_binary:
                return self._parse_lfs_pointer(blob.data)
            return {}

    return _is_large_file(repo_id, commit_id)
261
261
@reraise_safe_exceptions
def is_binary(self, wire, tree_id):
    """
    Return the ``is_binary`` flag of the object `tree_id` in the repository.

    The lookup goes through the region's conditional cache.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _is_binary(_repo_id, _tree_id):
        with self._factory.repo_libgit2(wire) as repo:
            return repo[tree_id].is_binary

    return _is_binary(repo_id, tree_id)
274
274
@reraise_safe_exceptions
def in_largefiles_store(self, wire, oid):
    """
    Tell whether `oid` is present in the configured LFS store.

    Returns False when ``vcs_git_lfs_store_location`` is not set in the wire
    config, otherwise the result of ``LFSOidStore.has_oid()``.
    """
    conf = self._wire_to_config(wire)
    with self._factory.repo_libgit2(wire) as repo:
        repo_name = repo.path

    store_location = conf.get('vcs_git_lfs_store_location')
    if not store_location:
        return False

    lfs_store = LFSOidStore(
        oid=oid, repo=repo_name, store_location=store_location)
    return lfs_store.has_oid()
290
290
@reraise_safe_exceptions
def store_path(self, wire, oid):
    """
    Return ``oid_path`` of the LFS store entry for `oid`.

    Raises ValueError when ``vcs_git_lfs_store_location`` is not set in the
    wire config.
    """
    conf = self._wire_to_config(wire)
    with self._factory.repo_libgit2(wire) as repo:
        repo_name = repo.path

    store_location = conf.get('vcs_git_lfs_store_location')
    if not store_location:
        raise ValueError('Unable to fetch oid with path {}'.format(oid))

    lfs_store = LFSOidStore(
        oid=oid, repo=repo_name, store_location=store_location)
    return lfs_store.oid_path
304
304
@reraise_safe_exceptions
def bulk_request(self, wire, rev, pre_load):
    """
    Collect several attributes of `rev` in one call.

    For every name in `pre_load` the matching method registered in
    ``self._bulk_methods`` is called with ``(wire, rev)`` and its result
    stored under that name. A KeyError raised while handling an attribute
    is re-raised via ``exceptions.VcsException`` as an unknown bulk
    attribute. The cached inner call receives `pre_load` sorted.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _bulk_request(_repo_id, _rev, _pre_load):
        collected = {}
        for attr in pre_load:
            try:
                collected[attr] = self._bulk_methods[attr](wire, rev)
            except KeyError as e:
                raise exceptions.VcsException(e)(
                    "Unknown bulk attribute: %s" % attr)
        return collected

    return _bulk_request(repo_id, rev, sorted(pre_load))
322
322
def _build_opener(self, url):
    """
    Create an urllib2 opener for `url`.

    When the parsed url carries auth info, basic and digest auth handlers
    sharing one password manager are installed; otherwise the opener is
    built without extra handlers.
    """
    _, authinfo = url_parser(url).authinfo()

    handlers = []
    if authinfo:
        # create a password manager
        passmgr = urllib2.HTTPPasswordMgrWithDefaultRealm()
        passmgr.add_password(*authinfo)

        handlers.append(httpbasicauthhandler(passmgr))
        handlers.append(httpdigestauthhandler(passmgr))

    return urllib2.build_opener(*handlers)
337
337
338 def _type_id_to_name(self, type_id):
338 def _type_id_to_name(self, type_id):
339 return {
339 return {
340 1: b'commit',
340 1: b'commit',
341 2: b'tree',
341 2: b'tree',
342 3: b'blob',
342 3: b'blob',
343 4: b'tag'
343 4: b'tag'
344 }[type_id]
344 }[type_id]
345
345
@reraise_safe_exceptions
def check_url(self, url, config):
    """
    Verify that `url` answers like a Git repository over HTTP.

    Requests ``<url>/info/refs?service=git-upload-pack`` and inspects the
    response body. Returns True on success; raises via
    ``exceptions.URLError`` when the URL cannot be opened, does not answer
    with code 200, or the body does not look like Git output. Only an
    obfuscated form of the URL is written to the log and error messages.
    `config` is not used by this method.
    """
    url_obj = url_parser(url)
    test_uri, _ = url_obj.authinfo()

    # mask credentials/query before the url ends up in logs or errors
    if url_obj.passwd:
        url_obj.passwd = '*****'
    url_obj.query = obfuscate_qs(url_obj.query)
    cleaned_uri = str(url_obj)
    log.info("Checking URL for remote cloning/import: %s", cleaned_uri)

    if not test_uri.endswith('info/refs'):
        test_uri = test_uri.rstrip('/') + '/info/refs'

    opener = self._build_opener(url)
    opener.addheaders = [('User-Agent', 'git/1.7.8.0')]  # fake some git

    query_string = '?%s' % urllib.urlencode({"service": 'git-upload-pack'})
    request = urllib2.Request("%s%s" % (test_uri, query_string), None, {})

    try:
        log.debug("Trying to open URL %s", cleaned_uri)
        resp = opener.open(request)
        if resp.code != 200:
            raise exceptions.URLError()('Return Code is not 200')
    except Exception as e:
        log.warning("URL cannot be opened: %s", cleaned_uri, exc_info=True)
        # means it cannot be cloned
        raise exceptions.URLError(e)("[%s] org_exc: %s" % (cleaned_uri, e))

    # now detect if it's proper git repo
    gitdata = resp.read()
    # old style git can return some other format, hence the sha + refs check
    looks_like_git = (
        'service=git-upload-pack' in gitdata
        or re.findall(r'[0-9a-fA-F]{40}\s+refs', gitdata))
    if not looks_like_git:
        raise exceptions.URLError()(
            "url [%s] does not look like an git" % (cleaned_uri,))

    return True
388
388
@reraise_safe_exceptions
def clone(self, wire, url, deferred, valid_refs, update_after_clone):
    """
    Pull from `url` and store the selected remote refs in the repository.

    A ref is stored when its name starts with one of `valid_refs` and does
    not end with `deferred`. With `update_after_clone` set, HEAD is set to
    the remote HEAD and the index is rebuilt from its tree.
    """
    # TODO(marcink): deprecate this method. Last i checked we don't use it anymore
    remote_refs = self.pull(wire, url, apply_refs=False)
    repo = self._factory.repo(wire)

    # str.startswith only accepts a str or a tuple of prefixes
    if isinstance(valid_refs, list):
        valid_refs = tuple(valid_refs)

    for ref_name in remote_refs:
        # only parse heads/tags and skip so called deferred tags
        if not ref_name.startswith(valid_refs):
            continue
        if ref_name.endswith(deferred):
            continue
        repo[ref_name] = remote_refs[ref_name]

    if not update_after_clone:
        return

    # we want to checkout HEAD
    repo["HEAD"] = remote_refs["HEAD"]
    index.build_index_from_tree(
        repo.path, repo.index_path(), repo.object_store, repo["HEAD"].tree)
407
407
@reraise_safe_exceptions
def branch(self, wire, commit_id):
    """
    Return the names of the ``refs/heads`` refs that point at `commit_id`.

    Names are returned without the ``refs/heads/`` prefix. The lookup goes
    through the region's conditional cache.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _branch(_context_uid, _repo_id, _commit_id):
        heads_re = re.compile('^refs/heads')
        return [
            ref_name.split('refs/heads/')[-1]
            for ref_name, ref_sha in self.get_refs(wire).items()
            if heads_re.match(ref_name) and ref_sha == _commit_id
        ]

    return _branch(context_uid, repo_id, commit_id)
422
422
@reraise_safe_exceptions
def commit_branches(self, wire, commit_id):
    """
    Return, as a list, what ``repo.branches.with_commit(commit_id)`` yields.

    The lookup goes through the region's conditional cache.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)

    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _commit_branches(_context_uid, _repo_id, _commit_id):
        with self._factory.repo_libgit2(wire) as repo:
            return list(repo.branches.with_commit(_commit_id))

    return _commit_branches(context_uid, repo_id, commit_id)
434
434
@reraise_safe_exceptions
def add_object(self, wire, content):
    """
    Store `content` as a new blob in the repository and return the blob id.

    :param wire: wire dict identifying the repository
    :param content: raw blob content
    :return: ``id`` of the created dulwich blob
    """
    # `object_store` belongs to the dulwich `Repo` API. The pygit2 based
    # `Repository` returned by `repo_libgit2` does not provide it, so the
    # dulwich repository is used here, the same way `commit` obtains it.
    repo = self._factory.repo(wire)

    blob = objects.Blob()
    blob.set_raw_string(content)
    repo.object_store.add_object(blob)
    return blob.id
443
443
444 # TODO: this is quite complex, check if that can be simplified
444 # TODO: this is quite complex, check if that can be simplified
445 @reraise_safe_exceptions
445 @reraise_safe_exceptions
446 def commit(self, wire, commit_data, branch, commit_tree, updated, removed):
446 def commit(self, wire, commit_data, branch, commit_tree, updated, removed):
447 repo = self._factory.repo(wire)
447 repo = self._factory.repo(wire)
448 object_store = repo.object_store
448 object_store = repo.object_store
449
449
450 # Create tree and populates it with blobs
450 # Create tree and populates it with blobs
451 commit_tree = commit_tree and repo[commit_tree] or objects.Tree()
451 commit_tree = commit_tree and repo[commit_tree] or objects.Tree()
452
452
453 for node in updated:
453 for node in updated:
454 # Compute subdirs if needed
454 # Compute subdirs if needed
455 dirpath, nodename = vcspath.split(node['path'])
455 dirpath, nodename = vcspath.split(node['path'])
456 dirnames = map(safe_str, dirpath and dirpath.split('/') or [])
456 dirnames = map(safe_str, dirpath and dirpath.split('/') or [])
457 parent = commit_tree
457 parent = commit_tree
458 ancestors = [('', parent)]
458 ancestors = [('', parent)]
459
459
460 # Tries to dig for the deepest existing tree
460 # Tries to dig for the deepest existing tree
461 while dirnames:
461 while dirnames:
462 curdir = dirnames.pop(0)
462 curdir = dirnames.pop(0)
463 try:
463 try:
464 dir_id = parent[curdir][1]
464 dir_id = parent[curdir][1]
465 except KeyError:
465 except KeyError:
466 # put curdir back into dirnames and stops
466 # put curdir back into dirnames and stops
467 dirnames.insert(0, curdir)
467 dirnames.insert(0, curdir)
468 break
468 break
469 else:
469 else:
470 # If found, updates parent
470 # If found, updates parent
471 parent = repo[dir_id]
471 parent = repo[dir_id]
472 ancestors.append((curdir, parent))
472 ancestors.append((curdir, parent))
473 # Now parent is deepest existing tree and we need to create
473 # Now parent is deepest existing tree and we need to create
474 # subtrees for dirnames (in reverse order)
474 # subtrees for dirnames (in reverse order)
475 # [this only applies for nodes from added]
475 # [this only applies for nodes from added]
476 new_trees = []
476 new_trees = []
477
477
478 blob = objects.Blob.from_string(node['content'])
478 blob = objects.Blob.from_string(node['content'])
479
479
480 if dirnames:
480 if dirnames:
481 # If there are trees which should be created we need to build
481 # If there are trees which should be created we need to build
482 # them now (in reverse order)
482 # them now (in reverse order)
483 reversed_dirnames = list(reversed(dirnames))
483 reversed_dirnames = list(reversed(dirnames))
484 curtree = objects.Tree()
484 curtree = objects.Tree()
485 curtree[node['node_path']] = node['mode'], blob.id
485 curtree[node['node_path']] = node['mode'], blob.id
486 new_trees.append(curtree)
486 new_trees.append(curtree)
487 for dirname in reversed_dirnames[:-1]:
487 for dirname in reversed_dirnames[:-1]:
488 newtree = objects.Tree()
488 newtree = objects.Tree()
489 newtree[dirname] = (DIR_STAT, curtree.id)
489 newtree[dirname] = (DIR_STAT, curtree.id)
490 new_trees.append(newtree)
490 new_trees.append(newtree)
491 curtree = newtree
491 curtree = newtree
492 parent[reversed_dirnames[-1]] = (DIR_STAT, curtree.id)
492 parent[reversed_dirnames[-1]] = (DIR_STAT, curtree.id)
493 else:
493 else:
494 parent.add(name=node['node_path'], mode=node['mode'], hexsha=blob.id)
494 parent.add(name=node['node_path'], mode=node['mode'], hexsha=blob.id)
495
495
496 new_trees.append(parent)
496 new_trees.append(parent)
497 # Update ancestors
497 # Update ancestors
498 reversed_ancestors = reversed(
498 reversed_ancestors = reversed(
499 [(a[1], b[1], b[0]) for a, b in zip(ancestors, ancestors[1:])])
499 [(a[1], b[1], b[0]) for a, b in zip(ancestors, ancestors[1:])])
500 for parent, tree, path in reversed_ancestors:
500 for parent, tree, path in reversed_ancestors:
501 parent[path] = (DIR_STAT, tree.id)
501 parent[path] = (DIR_STAT, tree.id)
502 object_store.add_object(tree)
502 object_store.add_object(tree)
503
503
504 object_store.add_object(blob)
504 object_store.add_object(blob)
505 for tree in new_trees:
505 for tree in new_trees:
506 object_store.add_object(tree)
506 object_store.add_object(tree)
507
507
508 for node_path in removed:
508 for node_path in removed:
509 paths = node_path.split('/')
509 paths = node_path.split('/')
510 tree = commit_tree
510 tree = commit_tree
511 trees = [tree]
511 trees = [tree]
512 # Traverse deep into the forest...
512 # Traverse deep into the forest...
513 for path in paths:
513 for path in paths:
514 try:
514 try:
515 obj = repo[tree[path][1]]
515 obj = repo[tree[path][1]]
516 if isinstance(obj, objects.Tree):
516 if isinstance(obj, objects.Tree):
517 trees.append(obj)
517 trees.append(obj)
518 tree = obj
518 tree = obj
519 except KeyError:
519 except KeyError:
520 break
520 break
521 # Cut down the blob and all rotten trees on the way back...
521 # Cut down the blob and all rotten trees on the way back...
522 for path, tree in reversed(zip(paths, trees)):
522 for path, tree in reversed(zip(paths, trees)):
523 del tree[path]
523 del tree[path]
524 if tree:
524 if tree:
525 # This tree still has elements - don't remove it or any
525 # This tree still has elements - don't remove it or any
526 # of it's parents
526 # of it's parents
527 break
527 break
528
528
529 object_store.add_object(commit_tree)
529 object_store.add_object(commit_tree)
530
530
531 # Create commit
531 # Create commit
532 commit = objects.Commit()
532 commit = objects.Commit()
533 commit.tree = commit_tree.id
533 commit.tree = commit_tree.id
534 for k, v in commit_data.iteritems():
534 for k, v in commit_data.iteritems():
535 setattr(commit, k, v)
535 setattr(commit, k, v)
536 object_store.add_object(commit)
536 object_store.add_object(commit)
537
537
538 self.create_branch(wire, branch, commit.id)
538 self.create_branch(wire, branch, commit.id)
539
539
540 # dulwich set-ref
540 # dulwich set-ref
541 ref = 'refs/heads/%s' % branch
541 ref = 'refs/heads/%s' % branch
542 repo.refs[ref] = commit.id
542 repo.refs[ref] = commit.id
543
543
544 return commit.id
544 return commit.id
545
545
@reraise_safe_exceptions
def pull(self, wire, url, apply_refs=True, refs=None, update_after=False):
    """
    Fetch from `url` into the repository described by `wire`.

    A `url` other than 'default' that has no '://' in it is fetched with
    `LocalGitClient`; everything else goes through `HttpGitClient`. When
    `refs` is given only those refs are requested and returned. With
    `apply_refs` the returned refs are written into the repository; with
    `update_after` HEAD is set to the remote HEAD and the index is built
    from the HEAD tree.

    Returns the remote refs mapping (restricted to `refs` when given).
    Raises the `exceptions.AbortException` wrapper when the remote is not
    a Git repository.
    """
    is_local_path = url != 'default' and '://' not in url
    if is_local_path:
        client = LocalGitClient(url)
    else:
        url_obj = url_parser(url)
        opener = self._build_opener(url)
        # only the first item returned by authinfo() is used, as the new url
        url, _ = url_obj.authinfo()
        client = HttpGitClient(base_url=url, opener=opener)
    repo = self._factory.repo(wire)

    determine_wants = repo.object_store.determine_wants_all
    if refs:
        def determine_wants_requested(references):
            # ask only for the remote refs that were explicitly requested
            return [references[name] for name in references if name in refs]
        determine_wants = determine_wants_requested

    try:
        remote_refs = client.fetch(
            path=url, target=repo, determine_wants=determine_wants)
    except NotGitRepository as e:
        log.warning(
            'Trying to fetch from "%s" failed, not a Git repository.', url)
        # Exception can contain unicode which we convert
        raise exceptions.AbortException(e)(repr(e))

    # mikhail: client.fetch() returns all the remote refs, but fetches only
    # refs filtered by `determine_wants` function. We need to filter result
    # as well
    if refs:
        remote_refs = {
            name: remote_refs[name] for name in remote_refs if name in refs}

    if apply_refs:
        # TODO: johbo: Needs proper test coverage with a git repository
        # that contains a tag object, so that we would end up with
        # a peeled ref at this point.
        for name in remote_refs:
            if k_is_peeled(name):
                log.debug("Skipping peeled reference %s", name)
                continue
            repo[name] = remote_refs[name]

        # NOTE(review): nesting of this check under `apply_refs` was
        # reconstructed from a flattened listing - confirm against the file.
        if refs and not update_after:
            # mikhail: explicitly set the head to the last ref.
            repo['HEAD'] = remote_refs[refs[-1]]

    if update_after:
        # we want to checkout HEAD
        repo["HEAD"] = remote_refs["HEAD"]
        index.build_index_from_tree(
            repo.path, repo.index_path(),
            repo.object_store, repo["HEAD"].tree)
    return remote_refs


def k_is_peeled(ref_name):
    """Tell whether `ref_name` ends with the peeled-ref marker."""
    return ref_name.endswith(PEELED_REF_MARKER)
598
598
@reraise_safe_exceptions
def sync_fetch(self, wire, url, refs=None, all_refs=False):
    """
    List the refs of `url` with `git ls-remote` and fetch them into the
    repository described by `wire`.

    `refs` may be a single value or a list/tuple; when given, only remote
    refs whose sha is in `refs` are fetched. Unless `all_refs` is set the
    listing is limited to heads and tags. Peeled refs, duplicates and HEAD
    are never recorded.

    Returns an ordered mapping of ref name to sha for every recorded ref,
    whether or not it was fetched.
    """
    self._factory.repo(wire)
    if refs and not isinstance(refs, (list, tuple)):
        refs = [refs]

    config = self._wire_to_config(wire)
    # get all remote refs we'll use to fetch later
    ls_remote_cmd = ['ls-remote']
    if not all_refs:
        ls_remote_cmd += ['--heads', '--tags']
    ls_remote_cmd += [url]
    output, __ = self.run_git_command(
        wire, ls_remote_cmd, fail_on_stderr=False,
        _copts=self._remote_conf(config),
        extra_env={'GIT_TERMINAL_PROMPT': '0'})

    remote_refs = collections.OrderedDict()
    fetch_refs = []

    for ref_line in output.splitlines():
        sha, ref = ref_line.split('\t')
        sha = sha.strip()
        if ref in remote_refs:
            # duplicate, skip
            continue
        if ref.endswith(PEELED_REF_MARKER):
            log.debug("Skipping peeled reference %s", ref)
            continue
        # don't sync HEAD
        if ref in ['HEAD']:
            continue

        remote_refs[ref] = sha

        # without explicit refs everything is fetched, otherwise we filter
        # fetch using our specified refs
        if not refs or sha in refs:
            fetch_refs.append('{}:{}'.format(ref, ref))
    log.debug('Finished obtaining fetch refs, total: %s', len(fetch_refs))

    if fetch_refs:
        # fetch in chunks so a single git call never gets too many refspecs
        for chunk in more_itertools.chunked(fetch_refs, 1024 * 4):
            fetch_refs_chunks = list(chunk)
            log.debug('Fetching %s refs from import url', len(fetch_refs_chunks))
            fetch_cmd = ['fetch', url, '--force', '--prune', '--'] + fetch_refs_chunks
            _out, _err = self.run_git_command(
                wire, fetch_cmd,
                fail_on_stderr=False,
                _copts=self._remote_conf(config),
                extra_env={'GIT_TERMINAL_PROMPT': '0'})

    return remote_refs
652
652
@reraise_safe_exceptions
def sync_push(self, wire, url, refs=None):
    """
    Run `git push --mirror` to `url` from the repository described by `wire`.

    Nothing is pushed (and None is returned) when `self.check_url` rejects
    the url. The `refs` argument is accepted but not used here.
    """
    if not self.check_url(url, wire):
        return
    config = self._wire_to_config(wire)
    # result is intentionally unused; the repo factory is still invoked
    self._factory.repo(wire)
    push_cmd = ['push', url, '--mirror']
    remote_copts = self._remote_conf(config)
    self.run_git_command(
        wire, push_cmd, fail_on_stderr=False,
        _copts=remote_copts,
        extra_env={'GIT_TERMINAL_PROMPT': '0'})
663
663
@reraise_safe_exceptions
def get_remote_refs(self, wire, url):
    """Open the repository at `url` and return its refs; `wire` is unused."""
    return Repo(url).get_refs()
668
668
@reraise_safe_exceptions
def get_description(self, wire):
    """Return the description of the repository described by `wire`."""
    return self._factory.repo(wire).get_description()
673
673
@reraise_safe_exceptions
def get_missing_revs(self, wire, rev1, rev2, path2):
    """
    Return the commit ids reachable from `rev2` but not from `rev1`.

    Objects are first fetched in both directions between the repository of
    `wire` and the one at `path2`; the walk itself runs on the repository
    at `path2`.
    """
    local_repo = self._factory.repo(wire)
    LocalGitClient(thin_packs=False).fetch(path2, local_repo)

    # same wire settings, pointed at the other repository
    wire_remote = wire.copy()
    wire_remote['path'] = path2
    repo_remote = self._factory.repo(wire_remote)
    LocalGitClient(thin_packs=False).fetch(wire["path"], repo_remote)

    walker = repo_remote.get_walker(include=[rev2], exclude=[rev1])
    revs = []
    for entry in walker:
        revs.append(entry.commit.id)
    return revs
688
688
@reraise_safe_exceptions
def get_object(self, wire, sha):
    """
    Resolve `sha` (a commit id or any revision spec) and describe the object.

    Tags are followed to their target. When `sha` is exactly the resolved
    id and the object did not come from a tag, the commit must be contained
    in at least one branch, otherwise it is reported as missing.

    Returns a dict with the keys 'id', 'type', 'commit_id' and 'idx'.
    Raises the `exceptions.LookupException` wrapper when nothing is found.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _get_object(_context_uid, _repo_id, _sha):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:

            missing_commit_err = 'Commit {} does not exist for `{}`'.format(sha, wire['path'])
            try:
                commit = repo.revparse_single(sha)
            except (KeyError, ValueError) as e:
                raise exceptions.LookupException(e)(missing_commit_err)

            is_tag = isinstance(commit, pygit2.Tag)
            if is_tag:
                commit = repo.get(commit.target)

            # we used a reference and it parsed means we're not having a
            # dangling commit; tags are never checked either
            check_dangling = (sha == commit.hex) and not is_tag

            if check_dangling:
                # check for dangling commit
                if not any(repo.branches.with_commit(commit.hex)):
                    raise exceptions.LookupException(None)(missing_commit_err)

            commit_id = commit.hex
            type_id = commit.type

            return {
                'id': commit_id,
                'type': self._type_id_to_name(type_id),
                'commit_id': commit_id,
                'idx': 0
            }

    return _get_object(context_uid, repo_id, sha)
735
735
@reraise_safe_exceptions
def get_refs(self, wire):
    """
    Return a dict mapping each ref name under refs/heads/ or refs/tags/
    to the hex id of its target.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _get_refs(_context_uid, _repo_id):

        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            regex = re.compile('^refs/(heads|tags)/')
            wanted = [
                ref for ref in repo.listall_reference_objects()
                if regex.match(ref.name)]
            refs_map = {}
            for ref in wanted:
                refs_map[ref.name] = ref.target.hex
            return refs_map

    return _get_refs(context_uid, repo_id)
749
749
@reraise_safe_exceptions
def get_branch_pointers(self, wire):
    """
    Return a dict mapping the target hex id of every ref whose name starts
    with 'refs/heads' to that ref's shorthand name.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _get_branch_pointers(_context_uid, _repo_id):

        repo_init = self._factory.repo_libgit2(wire)
        regex = re.compile('^refs/heads')
        with repo_init as repo:
            branches = [
                ref for ref in repo.listall_reference_objects()
                if regex.match(ref.name)]
            pointers = {}
            for branch in branches:
                # a later branch on the same commit overwrites an earlier one
                pointers[branch.target.hex] = branch.shorthand
            return pointers

    return _get_branch_pointers(context_uid, repo_id)
763
763
@reraise_safe_exceptions
def head(self, wire, show_exc=True):
    """
    Return the hex id of the object HEAD peels to.

    Any error while resolving HEAD is re-raised when `show_exc` is true;
    otherwise it is swallowed and None is returned.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _head(_context_uid, _repo_id, _show_exc):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            try:
                head_id = repo.head.peel().hex
            except Exception:
                if show_exc:
                    raise
                head_id = None
            return head_id
    return _head(context_uid, repo_id, show_exc)
777
777
@reraise_safe_exceptions
def init(self, wire):
    """Initialise a repository at wire['path'] and keep it on `self.repo`."""
    self.repo = Repo.init(str_to_dulwich(wire['path']))
782
782
@reraise_safe_exceptions
def init_bare(self, wire):
    """Initialise a bare repository at wire['path'] and keep it on `self.repo`."""
    self.repo = Repo.init_bare(str_to_dulwich(wire['path']))
787
787
@reraise_safe_exceptions
def revision(self, wire, rev):
    """
    Look up `rev` and return a dict with its hex 'id', plus the hex 'tree'
    id when the object has a `tree_id` attribute.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _revision(_context_uid, _repo_id, _rev):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            git_obj = repo[rev]
            obj_data = {}
            obj_data['id'] = git_obj.id.hex
            # tree objects itself don't have tree_id attribute
            if hasattr(git_obj, 'tree_id'):
                obj_data['tree'] = git_obj.tree_id.hex

            return obj_data
    return _revision(context_uid, repo_id, rev)
806
806
@reraise_safe_exceptions
def date(self, wire, commit_id):
    """
    Return `[commit_time, commit_time_offset]` for `commit_id`.

    An object without a `commit_time` attribute is first resolved through
    its `get_object()`.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _date(_repo_id, _commit_id):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            commit = repo[commit_id]

            if not hasattr(commit, 'commit_time'):
                commit = commit.get_object()

            # TODO(marcink): check dulwich difference of offset vs timezone
            return [commit.commit_time, commit.commit_time_offset]
    return _date(repo_id, commit_id)
825
825
@reraise_safe_exceptions
def author(self, wire, commit_id):
    """
    Return the author of `commit_id` as a unicode string.

    The result is "name <email>" when the author has an email. Otherwise it
    is the name alone, falling back to `safe_unicode(raw_name)` when reading
    the name fails.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _author(_repo_id, _commit_id):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            commit = repo[commit_id]

            # objects without an `author` are resolved via get_object() first
            holder = commit if hasattr(commit, 'author') else commit.get_object()
            signature = holder.author

            if signature.email:
                return u"{} <{}>".format(signature.name, signature.email)

            try:
                return u"{}".format(signature.name)
            except Exception:
                # the backend hands the raw name back as bytes, convert it
                return u"{}".format(safe_unicode(signature.raw_name))

    return _author(repo_id, commit_id)
845
849
@reraise_safe_exceptions
def message(self, wire, commit_id):
    """Return the `message` attribute of the object stored under `commit_id`."""
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _message(_repo_id, _commit_id):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            return repo[commit_id].message
    return _message(repo_id, commit_id)
856
860
@reraise_safe_exceptions
def parents(self, wire, commit_id):
    """
    Return the hex ids of the parents of `commit_id` as a list.

    An object without a `parent_ids` attribute is first resolved through
    its `get_object()`.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _parents(_repo_id, _commit_id):
        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            commit = repo[commit_id]
            holder = commit if hasattr(commit, 'parent_ids') else commit.get_object()
            hex_ids = []
            for parent_id in holder.parent_ids:
                hex_ids.append(parent_id.hex)
            return hex_ids
    return _parents(repo_id, commit_id)
872
876
@reraise_safe_exceptions
def children(self, wire, commit_id):
    """
    Return the ids of the direct children of `commit_id`.

    The ids are read from `git rev-list --all --children`: on every output
    line that starts with `commit_id`, the remaining space separated fields
    are collected. An empty list is returned when no line matches.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _children(_repo_id, _commit_id):
        output, __ = self.run_git_command(
            wire, ['rev-list', '--all', '--children'])

        child_ids = []
        # escape the id so it is always matched literally and can never be
        # interpreted as a regular expression
        pat = re.compile(r'^%s' % re.escape(commit_id))
        for line in output.splitlines():
            if pat.match(line):
                # first field is the commit itself, the rest are children
                found_ids = line.split(' ')[1:]
                child_ids.extend(found_ids)

        return child_ids
    return _children(repo_id, commit_id)
890
894
@reraise_safe_exceptions
def set_refs(self, wire, key, value):
    """Create the reference `key` pointing at `value`, forcing the creation."""
    with self._factory.repo_libgit2(wire) as repo:
        repo.references.create(key, value, force=True)
896
900
@reraise_safe_exceptions
def create_branch(self, wire, branch_name, commit_id, force=False):
    """
    Create the local branch `branch_name` at `commit_id`.

    Without `force` the branch is created only when `repo.branches.get`
    finds no branch of that name; with `force` the create call is always
    made and `force` is passed through to it.
    """
    with self._factory.repo_libgit2(wire) as repo:
        commit = repo[commit_id]

        # the existence lookup is skipped entirely when forcing
        if force or not repo.branches.get(branch_name):
            repo.branches.local.create(branch_name, commit, force=force)
908
912
@reraise_safe_exceptions
def remove_ref(self, wire, key):
    """Delete the reference named `key` from the repository."""
    with self._factory.repo_libgit2(wire) as repo:
        repo.references.delete(key)
914
918
@reraise_safe_exceptions
def tag_remove(self, wire, tag_name):
    """Delete the reference 'refs/tags/<tag_name>' from the repository."""
    with self._factory.repo_libgit2(wire) as repo:
        tag_ref = 'refs/tags/{}'.format(tag_name)
        repo.references.delete(tag_ref)
921
925
@reraise_safe_exceptions
def tree_changes(self, wire, source_id, target_id):
    """
    Return, as a list, the object store's tree changes between the trees of
    `source_id` and `target_id`. A falsy `source_id` means no source tree.
    """
    # TODO(marcink): remove this seems it's only used by tests
    repo = self._factory.repo(wire)
    if source_id:
        source_tree = repo[source_id].tree
    else:
        source_tree = None
    target_tree = repo[target_id].tree
    return list(repo.object_store.tree_changes(source_tree, target_tree))
930
934
@reraise_safe_exceptions
def tree_and_type_for_path(self, wire, commit_id, path):
    """
    Look up `path` inside the tree of `commit_id`.

    Returns a `(hex id, type, filemode)` tuple for the entry, or
    `(None, None, None)` when the path does not exist in that tree.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _tree_and_type_for_path(_context_uid, _repo_id, _commit_id, _path):
        repo_init = self._factory.repo_libgit2(wire)

        with repo_init as repo:
            commit = repo[commit_id]
            try:
                entry = commit.tree[path]
            except KeyError:
                return None, None, None
            else:
                return entry.id.hex, entry.type, entry.filemode
    return _tree_and_type_for_path(context_uid, repo_id, commit_id, path)
948
952
@reraise_safe_exceptions
def tree_items(self, wire, tree_id):
    """
    List the entries of the tree `tree_id`.

    Returns a list of `(name, filemode, hex id, type)` tuples, where the
    type 'commit' is reported as 'link'. Raises `ObjectMissing` when the
    repository has no object under `tree_id`.
    """
    cache_on, context_uid, repo_id = self._cache_on(wire)
    # NOTE(review): nested function name kept as-is, the cache decorator may
    # use it when building keys - confirm before renaming.
    @self.region.conditional_cache_on_arguments(condition=cache_on)
    def _tree_items(_repo_id, _tree_id):

        repo_init = self._factory.repo_libgit2(wire)
        with repo_init as repo:
            try:
                tree = repo[tree_id]
            except KeyError:
                raise ObjectMissing('No tree with id: {}'.format(tree_id))

            entries = []
            for entry in tree:
                sha, mode, kind = entry.hex, entry.filemode, entry.type

                if kind == 'commit':
                    # NOTE(marcink): submodules we translate to 'link' for backward compat
                    kind = 'link'

                entries.append((entry.name, mode, sha, kind))
            return entries
    return _tree_items(repo_id, tree_id)
975
979
@reraise_safe_exceptions
def diff_2(self, wire, commit_id_1, commit_id_2, file_filter, opt_ignorews, context):
    """
    Old version that uses subprocess to call diff

    Runs `git diff` between the two commits, or `git show` on `commit_id_2`
    when `commit_id_1` is the empty commit, and returns the patch text.
    `context` sets the number of context lines, `opt_ignorews` adds
    `--ignore-all-space` and a truthy `file_filter` limits the diff to it.
    """
    from_empty = commit_id_1 == self.EMPTY_COMMIT

    # '--indent-heuristic', '--full-index' and '--abbrev=40' are
    # deliberately not passed
    flags = ['-U%s' % context]
    flags += [
        '--patch',
        '--binary',
        '--find-renames',
        '--no-indent-heuristic',
    ]
    if opt_ignorews:
        flags.append('--ignore-all-space')

    if from_empty:
        cmd = ['show'] + flags + [commit_id_2]
    else:
        cmd = ['diff'] + flags + [commit_id_1, commit_id_2]

    if file_filter:
        cmd.extend(['--', file_filter])

    diff, __ = self.run_git_command(wire, cmd)
    if not from_empty:
        return diff

    # If we used 'show' command, strip first few lines (until actual diff
    # starts)
    lines = diff.splitlines()
    start = len(lines)
    for pos, line in enumerate(lines):
        if line.startswith('diff'):
            start = pos
            break
    # Append new line just like 'diff' command do
    return '\n'.join(lines[start:]) + '\n'
1016
1020
1017 @reraise_safe_exceptions
1021 @reraise_safe_exceptions
1018 def diff(self, wire, commit_id_1, commit_id_2, file_filter, opt_ignorews, context):
1022 def diff(self, wire, commit_id_1, commit_id_2, file_filter, opt_ignorews, context):
1019 repo_init = self._factory.repo_libgit2(wire)
1023 repo_init = self._factory.repo_libgit2(wire)
1020 with repo_init as repo:
1024 with repo_init as repo:
1021 swap = True
1025 swap = True
1022 flags = 0
1026 flags = 0
1023 flags |= pygit2.GIT_DIFF_SHOW_BINARY
1027 flags |= pygit2.GIT_DIFF_SHOW_BINARY
1024
1028
1025 if opt_ignorews:
1029 if opt_ignorews:
1026 flags |= pygit2.GIT_DIFF_IGNORE_WHITESPACE
1030 flags |= pygit2.GIT_DIFF_IGNORE_WHITESPACE
1027
1031
1028 if commit_id_1 == self.EMPTY_COMMIT:
1032 if commit_id_1 == self.EMPTY_COMMIT:
1029 comm1 = repo[commit_id_2]
1033 comm1 = repo[commit_id_2]
1030 diff_obj = comm1.tree.diff_to_tree(
1034 diff_obj = comm1.tree.diff_to_tree(
1031 flags=flags, context_lines=context, swap=swap)
1035 flags=flags, context_lines=context, swap=swap)
1032
1036
1033 else:
1037 else:
1034 comm1 = repo[commit_id_2]
1038 comm1 = repo[commit_id_2]
1035 comm2 = repo[commit_id_1]
1039 comm2 = repo[commit_id_1]
1036 diff_obj = comm1.tree.diff_to_tree(
1040 diff_obj = comm1.tree.diff_to_tree(
1037 comm2.tree, flags=flags, context_lines=context, swap=swap)
1041 comm2.tree, flags=flags, context_lines=context, swap=swap)
1038 similar_flags = 0
1042 similar_flags = 0
1039 similar_flags |= pygit2.GIT_DIFF_FIND_RENAMES
1043 similar_flags |= pygit2.GIT_DIFF_FIND_RENAMES
1040 diff_obj.find_similar(flags=similar_flags)
1044 diff_obj.find_similar(flags=similar_flags)
1041
1045
1042 if file_filter:
1046 if file_filter:
1043 for p in diff_obj:
1047 for p in diff_obj:
1044 if p.delta.old_file.path == file_filter:
1048 if p.delta.old_file.path == file_filter:
1045 return p.patch or ''
1049 return p.patch or ''
1046 # fo matching path == no diff
1050 # fo matching path == no diff
1047 return ''
1051 return ''
1048 return diff_obj.patch or ''
1052 return diff_obj.patch or ''
1049
1053
1050 @reraise_safe_exceptions
1054 @reraise_safe_exceptions
1051 def node_history(self, wire, commit_id, path, limit):
1055 def node_history(self, wire, commit_id, path, limit):
1052 cache_on, context_uid, repo_id = self._cache_on(wire)
1056 cache_on, context_uid, repo_id = self._cache_on(wire)
1053 @self.region.conditional_cache_on_arguments(condition=cache_on)
1057 @self.region.conditional_cache_on_arguments(condition=cache_on)
1054 def _node_history(_context_uid, _repo_id, _commit_id, _path, _limit):
1058 def _node_history(_context_uid, _repo_id, _commit_id, _path, _limit):
1055 # optimize for n==1, rev-list is much faster for that use-case
1059 # optimize for n==1, rev-list is much faster for that use-case
1056 if limit == 1:
1060 if limit == 1:
1057 cmd = ['rev-list', '-1', commit_id, '--', path]
1061 cmd = ['rev-list', '-1', commit_id, '--', path]
1058 else:
1062 else:
1059 cmd = ['log']
1063 cmd = ['log']
1060 if limit:
1064 if limit:
1061 cmd.extend(['-n', str(safe_int(limit, 0))])
1065 cmd.extend(['-n', str(safe_int(limit, 0))])
1062 cmd.extend(['--pretty=format: %H', '-s', commit_id, '--', path])
1066 cmd.extend(['--pretty=format: %H', '-s', commit_id, '--', path])
1063
1067
1064 output, __ = self.run_git_command(wire, cmd)
1068 output, __ = self.run_git_command(wire, cmd)
1065 commit_ids = re.findall(r'[0-9a-fA-F]{40}', output)
1069 commit_ids = re.findall(r'[0-9a-fA-F]{40}', output)
1066
1070
1067 return [x for x in commit_ids]
1071 return [x for x in commit_ids]
1068 return _node_history(context_uid, repo_id, commit_id, path, limit)
1072 return _node_history(context_uid, repo_id, commit_id, path, limit)
1069
1073
1070 @reraise_safe_exceptions
1074 @reraise_safe_exceptions
1071 def node_annotate(self, wire, commit_id, path):
1075 def node_annotate(self, wire, commit_id, path):
1072
1076
1073 cmd = ['blame', '-l', '--root', '-r', commit_id, '--', path]
1077 cmd = ['blame', '-l', '--root', '-r', commit_id, '--', path]
1074 # -l ==> outputs long shas (and we need all 40 characters)
1078 # -l ==> outputs long shas (and we need all 40 characters)
1075 # --root ==> doesn't put '^' character for boundaries
1079 # --root ==> doesn't put '^' character for boundaries
1076 # -r commit_id ==> blames for the given commit
1080 # -r commit_id ==> blames for the given commit
1077 output, __ = self.run_git_command(wire, cmd)
1081 output, __ = self.run_git_command(wire, cmd)
1078
1082
1079 result = []
1083 result = []
1080 for i, blame_line in enumerate(output.split('\n')[:-1]):
1084 for i, blame_line in enumerate(output.split('\n')[:-1]):
1081 line_no = i + 1
1085 line_no = i + 1
1082 commit_id, line = re.split(r' ', blame_line, 1)
1086 commit_id, line = re.split(r' ', blame_line, 1)
1083 result.append((line_no, commit_id, line))
1087 result.append((line_no, commit_id, line))
1084 return result
1088 return result
1085
1089
1086 @reraise_safe_exceptions
1090 @reraise_safe_exceptions
1087 def update_server_info(self, wire):
1091 def update_server_info(self, wire):
1088 repo = self._factory.repo(wire)
1092 repo = self._factory.repo(wire)
1089 update_server_info(repo)
1093 update_server_info(repo)
1090
1094
1091 @reraise_safe_exceptions
1095 @reraise_safe_exceptions
1092 def get_all_commit_ids(self, wire):
1096 def get_all_commit_ids(self, wire):
1093
1097
1094 cache_on, context_uid, repo_id = self._cache_on(wire)
1098 cache_on, context_uid, repo_id = self._cache_on(wire)
1095 @self.region.conditional_cache_on_arguments(condition=cache_on)
1099 @self.region.conditional_cache_on_arguments(condition=cache_on)
1096 def _get_all_commit_ids(_context_uid, _repo_id):
1100 def _get_all_commit_ids(_context_uid, _repo_id):
1097
1101
1098 cmd = ['rev-list', '--reverse', '--date-order', '--branches', '--tags']
1102 cmd = ['rev-list', '--reverse', '--date-order', '--branches', '--tags']
1099 try:
1103 try:
1100 output, __ = self.run_git_command(wire, cmd)
1104 output, __ = self.run_git_command(wire, cmd)
1101 return output.splitlines()
1105 return output.splitlines()
1102 except Exception:
1106 except Exception:
1103 # Can be raised for empty repositories
1107 # Can be raised for empty repositories
1104 return []
1108 return []
1105 return _get_all_commit_ids(context_uid, repo_id)
1109 return _get_all_commit_ids(context_uid, repo_id)
1106
1110
1107 @reraise_safe_exceptions
1111 @reraise_safe_exceptions
1108 def run_git_command(self, wire, cmd, **opts):
1112 def run_git_command(self, wire, cmd, **opts):
1109 path = wire.get('path', None)
1113 path = wire.get('path', None)
1110
1114
1111 if path and os.path.isdir(path):
1115 if path and os.path.isdir(path):
1112 opts['cwd'] = path
1116 opts['cwd'] = path
1113
1117
1114 if '_bare' in opts:
1118 if '_bare' in opts:
1115 _copts = []
1119 _copts = []
1116 del opts['_bare']
1120 del opts['_bare']
1117 else:
1121 else:
1118 _copts = ['-c', 'core.quotepath=false', ]
1122 _copts = ['-c', 'core.quotepath=false', ]
1119 safe_call = False
1123 safe_call = False
1120 if '_safe' in opts:
1124 if '_safe' in opts:
1121 # no exc on failure
1125 # no exc on failure
1122 del opts['_safe']
1126 del opts['_safe']
1123 safe_call = True
1127 safe_call = True
1124
1128
1125 if '_copts' in opts:
1129 if '_copts' in opts:
1126 _copts.extend(opts['_copts'] or [])
1130 _copts.extend(opts['_copts'] or [])
1127 del opts['_copts']
1131 del opts['_copts']
1128
1132
1129 gitenv = os.environ.copy()
1133 gitenv = os.environ.copy()
1130 gitenv.update(opts.pop('extra_env', {}))
1134 gitenv.update(opts.pop('extra_env', {}))
1131 # need to clean fix GIT_DIR !
1135 # need to clean fix GIT_DIR !
1132 if 'GIT_DIR' in gitenv:
1136 if 'GIT_DIR' in gitenv:
1133 del gitenv['GIT_DIR']
1137 del gitenv['GIT_DIR']
1134 gitenv['GIT_CONFIG_NOGLOBAL'] = '1'
1138 gitenv['GIT_CONFIG_NOGLOBAL'] = '1'
1135 gitenv['GIT_DISCOVERY_ACROSS_FILESYSTEM'] = '1'
1139 gitenv['GIT_DISCOVERY_ACROSS_FILESYSTEM'] = '1'
1136
1140
1137 cmd = [settings.GIT_EXECUTABLE] + _copts + cmd
1141 cmd = [settings.GIT_EXECUTABLE] + _copts + cmd
1138 _opts = {'env': gitenv, 'shell': False}
1142 _opts = {'env': gitenv, 'shell': False}
1139
1143
1140 proc = None
1144 proc = None
1141 try:
1145 try:
1142 _opts.update(opts)
1146 _opts.update(opts)
1143 proc = subprocessio.SubprocessIOChunker(cmd, **_opts)
1147 proc = subprocessio.SubprocessIOChunker(cmd, **_opts)
1144
1148
1145 return ''.join(proc), ''.join(proc.error)
1149 return ''.join(proc), ''.join(proc.error)
1146 except (EnvironmentError, OSError) as err:
1150 except (EnvironmentError, OSError) as err:
1147 cmd = ' '.join(cmd) # human friendly CMD
1151 cmd = ' '.join(cmd) # human friendly CMD
1148 tb_err = ("Couldn't run git command (%s).\n"
1152 tb_err = ("Couldn't run git command (%s).\n"
1149 "Original error was:%s\n"
1153 "Original error was:%s\n"
1150 "Call options:%s\n"
1154 "Call options:%s\n"
1151 % (cmd, err, _opts))
1155 % (cmd, err, _opts))
1152 log.exception(tb_err)
1156 log.exception(tb_err)
1153 if safe_call:
1157 if safe_call:
1154 return '', err
1158 return '', err
1155 else:
1159 else:
1156 raise exceptions.VcsException()(tb_err)
1160 raise exceptions.VcsException()(tb_err)
1157 finally:
1161 finally:
1158 if proc:
1162 if proc:
1159 proc.close()
1163 proc.close()
1160
1164
1161 @reraise_safe_exceptions
1165 @reraise_safe_exceptions
1162 def install_hooks(self, wire, force=False):
1166 def install_hooks(self, wire, force=False):
1163 from vcsserver.hook_utils import install_git_hooks
1167 from vcsserver.hook_utils import install_git_hooks
1164 bare = self.bare(wire)
1168 bare = self.bare(wire)
1165 path = wire['path']
1169 path = wire['path']
1166 return install_git_hooks(path, bare, force_create=force)
1170 return install_git_hooks(path, bare, force_create=force)
1167
1171
1168 @reraise_safe_exceptions
1172 @reraise_safe_exceptions
1169 def get_hooks_info(self, wire):
1173 def get_hooks_info(self, wire):
1170 from vcsserver.hook_utils import (
1174 from vcsserver.hook_utils import (
1171 get_git_pre_hook_version, get_git_post_hook_version)
1175 get_git_pre_hook_version, get_git_post_hook_version)
1172 bare = self.bare(wire)
1176 bare = self.bare(wire)
1173 path = wire['path']
1177 path = wire['path']
1174 return {
1178 return {
1175 'pre_version': get_git_pre_hook_version(path, bare),
1179 'pre_version': get_git_pre_hook_version(path, bare),
1176 'post_version': get_git_post_hook_version(path, bare),
1180 'post_version': get_git_post_hook_version(path, bare),
1177 }
1181 }
@@ -1,89 +1,110 b''
1 # RhodeCode VCSServer provides access to different vcs backends via network.
1 # RhodeCode VCSServer provides access to different vcs backends via network.
2 # Copyright (C) 2014-2019 RhodeCode GmbH
2 # Copyright (C) 2014-2019 RhodeCode GmbH
3 #
3 #
4 # This program is free software; you can redistribute it and/or modify
4 # This program is free software; you can redistribute it and/or modify
5 # it under the terms of the GNU General Public License as published by
5 # it under the terms of the GNU General Public License as published by
6 # the Free Software Foundation; either version 3 of the License, or
6 # the Free Software Foundation; either version 3 of the License, or
7 # (at your option) any later version.
7 # (at your option) any later version.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU General Public License
14 # You should have received a copy of the GNU General Public License
15 # along with this program; if not, write to the Free Software Foundation,
15 # along with this program; if not, write to the Free Software Foundation,
16 # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
16 # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17 import logging
17 import logging
18 import hashlib
18 import hashlib
19
19
20 log = logging.getLogger(__name__)
20 log = logging.getLogger(__name__)
21
21
22
22
23 def safe_int(val, default=None):
23 def safe_int(val, default=None):
24 """
24 """
25 Returns int() of val if val is not convertable to int use default
25 Returns int() of val if val is not convertable to int use default
26 instead
26 instead
27
27
28 :param val:
28 :param val:
29 :param default:
29 :param default:
30 """
30 """
31
31
32 try:
32 try:
33 val = int(val)
33 val = int(val)
34 except (ValueError, TypeError):
34 except (ValueError, TypeError):
35 val = default
35 val = default
36
36
37 return val
37 return val
38
38
39
39
40 def safe_str(unicode_, to_encoding=['utf8']):
40 def safe_str(unicode_, to_encoding=None):
41 """
41 """
42 safe str function. Does few trick to turn unicode_ into string
42 safe str function. Does few trick to turn unicode_ into string
43
43
44 In case of UnicodeEncodeError, we try to return it with encoding detected
45 by chardet library if it fails fallback to string with errors replaced
46
47 :param unicode_: unicode to encode
44 :param unicode_: unicode to encode
45 :param to_encoding: encode to this type UTF8 default
48 :rtype: str
46 :rtype: str
49 :returns: str object
47 :returns: str object
50 """
48 """
51
49 to_encoding = to_encoding or ['utf8']
52 # if it's not basestr cast to str
50 # if it's not basestr cast to str
53 if not isinstance(unicode_, basestring):
51 if not isinstance(unicode_, basestring):
54 return str(unicode_)
52 return str(unicode_)
55
53
56 if isinstance(unicode_, str):
54 if isinstance(unicode_, str):
57 return unicode_
55 return unicode_
58
56
59 if not isinstance(to_encoding, (list, tuple)):
57 if not isinstance(to_encoding, (list, tuple)):
60 to_encoding = [to_encoding]
58 to_encoding = [to_encoding]
61
59
62 for enc in to_encoding:
60 for enc in to_encoding:
63 try:
61 try:
64 return unicode_.encode(enc)
62 return unicode_.encode(enc)
65 except UnicodeEncodeError:
63 except UnicodeEncodeError:
66 pass
64 pass
67
65
66 return unicode_.encode(to_encoding[0], 'replace')
67
68
69 def safe_unicode(str_, from_encoding=None):
70 """
71 safe unicode function. Does few trick to turn str_ into unicode
72
73 :param str_: string to decode
74 :param from_encoding: encode from this type UTF8 default
75 :rtype: unicode
76 :returns: unicode object
77 """
78 from_encoding = from_encoding or ['utf8']
79
80 if isinstance(str_, unicode):
81 return str_
82
83 if not isinstance(from_encoding, (list, tuple)):
84 from_encoding = [from_encoding]
85
68 try:
86 try:
69 import chardet
87 return unicode(str_)
70 encoding = chardet.detect(unicode_)['encoding']
88 except UnicodeDecodeError:
71 if encoding is None:
89 pass
72 raise UnicodeEncodeError()
73
90
74 return unicode_.encode(encoding)
91 for enc in from_encoding:
75 except (ImportError, UnicodeEncodeError):
92 try:
76 return unicode_.encode(to_encoding[0], 'replace')
93 return unicode(str_, enc)
94 except UnicodeDecodeError:
95 pass
96
97 return unicode(str_, from_encoding[0], 'replace')
77
98
78
99
79 class AttributeDict(dict):
100 class AttributeDict(dict):
80 def __getattr__(self, attr):
101 def __getattr__(self, attr):
81 return self.get(attr, None)
102 return self.get(attr, None)
82 __setattr__ = dict.__setitem__
103 __setattr__ = dict.__setitem__
83 __delattr__ = dict.__delitem__
104 __delattr__ = dict.__delitem__
84
105
85
106
86 def sha1(val):
107 def sha1(val):
87 return hashlib.sha1(val).hexdigest()
108 return hashlib.sha1(val).hexdigest()
88
109
89
110
General Comments 0
You need to be logged in to leave comments. Login now