rhodecode-enterprise-ce Commit - r4352:122ebfb8

1

# -*- coding: utf-8 -*-

1

# -*- coding: utf-8 -*-

2

3

4

#

4

#

5

# This program is free software: you can redistribute it and/or modify

5

# This program is free software: you can redistribute it and/or modify

6

# it under the terms of the GNU Affero General Public License, version 3

6

# it under the terms of the GNU Affero General Public License, version 3

7

# (only), as published by the Free Software Foundation.

7

# (only), as published by the Free Software Foundation.

8

#

8

#

9

# This program is distributed in the hope that it will be useful,

9

# This program is distributed in the hope that it will be useful,

10

# but WITHOUT ANY WARRANTY; without even the implied warranty of

10

# but WITHOUT ANY WARRANTY; without even the implied warranty of

11

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

11

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

12

# GNU General Public License for more details.

12

# GNU General Public License for more details.

13

#

13

#

14

# You should have received a copy of the GNU Affero General Public License

14

# You should have received a copy of the GNU Affero General Public License

15

# along with this program. If not, see <http://www.gnu.org/licenses/>.

15

# along with this program. If not, see <http://www.gnu.org/licenses/>.

16

#

16

#

17

# This program is dual-licensed. If you wish to learn more about the

17

# This program is dual-licensed. If you wish to learn more about the

18

# RhodeCode Enterprise Edition, including its added features, Support services,

18

# RhodeCode Enterprise Edition, including its added features, Support services,

19

# and proprietary license terms, please see https://rhodecode.com/licenses/

19

# and proprietary license terms, please see https://rhodecode.com/licenses/

20

21

"""

21

"""

22

Implementation of the scm_app interface using raw HTTP communication.

22

Implementation of the scm_app interface using raw HTTP communication.

23

"""

23

"""

24

25

import base64

25

import base64

26

import logging

26

import logging

27

import urlparse

27

import urlparse

28

import wsgiref.util

28

import wsgiref.util

29

30

import msgpack

30

import msgpack

31

import requests

31

import requests

32

import webob.request

32

import webob.request

33

34

import rhodecode

34

import rhodecode

35

36

37

log = logging.getLogger(__name__)

37

log = logging.getLogger(__name__)

38

39

40

def create_git_wsgi_app(repo_path, repo_name, config):

40

def create_git_wsgi_app(repo_path, repo_name, config):

41

url = _vcs_streaming_url() + 'git/'

41

url = _vcs_streaming_url() + 'git/'

42

return VcsHttpProxy(url, repo_path, repo_name, config)

42

return VcsHttpProxy(url, repo_path, repo_name, config)

43

44

45

def create_hg_wsgi_app(repo_path, repo_name, config):

45

def create_hg_wsgi_app(repo_path, repo_name, config):

46

url = _vcs_streaming_url() + 'hg/'

46

url = _vcs_streaming_url() + 'hg/'

47

return VcsHttpProxy(url, repo_path, repo_name, config)

47

return VcsHttpProxy(url, repo_path, repo_name, config)

48

49

50

def _vcs_streaming_url():

50

def _vcs_streaming_url():

51

template = 'http://{}/stream/'

51

template = 'http://{}/stream/'

52

return template.format(rhodecode.CONFIG['vcs.server'])

52

return template.format(rhodecode.CONFIG['vcs.server'])

53

54

55

# TODO: johbo: Avoid the global.

55

# TODO: johbo: Avoid the global.

56

session = requests.Session()

56

session = requests.Session()

57

# Requests speedup, avoid reading .netrc and similar

57

# Requests speedup, avoid reading .netrc and similar

58

session.trust_env = False

58

session.trust_env = False

59

60

# prevent urllib3 spawning our logs.

60

# prevent urllib3 spawning our logs.

61

logging.getLogger("requests.packages.urllib3.connectionpool").setLevel(

61

logging.getLogger("requests.packages.urllib3.connectionpool").setLevel(

62

logging.WARNING)

62

logging.WARNING)

63

64

65

class VcsHttpProxy(object):

65

class VcsHttpProxy(object):

66

"""

66

"""

67

A WSGI application which proxies vcs requests.

67

A WSGI application which proxies vcs requests.

68

69

The goal is to shuffle the data around without touching it. The only

69

The goal is to shuffle the data around without touching it. The only

70

exception is the extra data from the config object which we send to the

70

exception is the extra data from the config object which we send to the

71

server as well.

71

server as well.

72

"""

72

"""

73

74

def __init__(self, url, repo_path, repo_name, config):

74

def __init__(self, url, repo_path, repo_name, config):

75

"""

75

"""

76

:param str url: The URL of the VCSServer to call.

76

:param str url: The URL of the VCSServer to call.

77

"""

77

"""

78

self._url = url

78

self._url = url

79

self._repo_name = repo_name

79

self._repo_name = repo_name

80

self._repo_path = repo_path

80

self._repo_path = repo_path

81

self._config = config

81

self._config = config

82

self.rc_extras = {}

82

log.debug(

83

log.debug(

83

"Creating VcsHttpProxy for repo %s, url %s",

84

"Creating VcsHttpProxy for repo %s, url %s",

84

repo_name, url)

85

repo_name, url)

85

86

def __call__(self, environ, start_response):

87

def __call__(self, environ, start_response):

87

config = msgpack.packb(self._config)

88

config = msgpack.packb(self._config)

88

request = webob.request.Request(environ)

89

request = webob.request.Request(environ)

89

request_headers = request.headers

90

request_headers = request.headers

91

90

request_headers.update({

92

request_headers.update({

91

# TODO: johbo: Remove this, rely on URL path only

93

# TODO: johbo: Remove this, rely on URL path only

92

'X-RC-Repo-Name': self._repo_name,

94

'X-RC-Repo-Name': self._repo_name,

93

'X-RC-Repo-Path': self._repo_path,

95

'X-RC-Repo-Path': self._repo_path,

94

'X-RC-Path-Info': environ['PATH_INFO'],

96

'X-RC-Path-Info': environ['PATH_INFO'],

97

98

'X-RC-Repo-Store': self.rc_extras.get('repo_store'),

99

'X-RC-Server-Config-File': self.rc_extras.get('config'),

100

101

'X-RC-Auth-User': self.rc_extras.get('username'),

102

'X-RC-Auth-User-Id': self.rc_extras.get('user_id'),

103

'X-RC-Auth-User-Ip': self.rc_extras.get('ip'),

104

95

# TODO: johbo: Avoid encoding and put this into payload?

105

# TODO: johbo: Avoid encoding and put this into payload?

96

'X-RC-Repo-Config': base64.b64encode(config),

106

'X-RC-Repo-Config': base64.b64encode(config),

97

'X-RC-Locked-Status-Code': rhodecode.CONFIG.get('lock_ret_code')

107

'X-RC-Locked-Status-Code': rhodecode.CONFIG.get('lock_ret_code'),

98

})

108

})

99

109

100

method = environ['REQUEST_METHOD']

110

method = environ['REQUEST_METHOD']

101

111

102

# Preserve the query string

112

# Preserve the query string

103

url = self._url

113

url = self._url

104

url = urlparse.urljoin(url, self._repo_name)

114

url = urlparse.urljoin(url, self._repo_name)

105

if environ.get('QUERY_STRING'):

115

if environ.get('QUERY_STRING'):

106

url += '?' + environ['QUERY_STRING']

116

url += '?' + environ['QUERY_STRING']

107

117

108

log.debug('http-app: preparing request to: %s', url)

118

log.debug('http-app: preparing request to: %s', url)

109

response = session.request(

119

response = session.request(

110

method,

120

method,

111

url,

121

url,

112

data=_maybe_stream_request(environ),

122

data=_maybe_stream_request(environ),

113

headers=request_headers,

123

headers=request_headers,

114

stream=True)

124

stream=True)

115

125

116

log.debug('http-app: got vcsserver response: %s', response)

126

log.debug('http-app: got vcsserver response: %s', response)

117

if response.status_code >= 500:

127

if response.status_code >= 500:

118

log.error('Exception returned by vcsserver at: %s %s, %s',

128

log.error('Exception returned by vcsserver at: %s %s, %s',

119

url, response.status_code, response.content)

129

url, response.status_code, response.content)

120

130

121

# Preserve the headers of the response, except hop_by_hop ones

131

# Preserve the headers of the response, except hop_by_hop ones

122

response_headers = [

132

response_headers = [

123

(h, v) for h, v in response.headers.items()

133

(h, v) for h, v in response.headers.items()

124

if not wsgiref.util.is_hop_by_hop(h)

134

if not wsgiref.util.is_hop_by_hop(h)

125

]

135

]

126

136

127

# Build status argument for start_response callable.

137

# Build status argument for start_response callable.

128

status = '{status_code} {reason_phrase}'.format(

138

status = '{status_code} {reason_phrase}'.format(

129

status_code=response.status_code,

139

status_code=response.status_code,

130

reason_phrase=response.reason)

140

reason_phrase=response.reason)

131

141

132

start_response(status, response_headers)

142

start_response(status, response_headers)

133

return _maybe_stream_response(response)

143

return _maybe_stream_response(response)

134

144

135

145

136

def read_in_chunks(stream_obj, block_size=1024, chunks=-1):

146

def read_in_chunks(stream_obj, block_size=1024, chunks=-1):

137

"""

147

"""

138

Read Stream in chunks, default chunk size: 1k.

148

Read Stream in chunks, default chunk size: 1k.

139

"""

149

"""

140

while chunks:

150

while chunks:

141

data = stream_obj.read(block_size)

151

data = stream_obj.read(block_size)

142

if not data:

152

if not data:

143

break

153

break

144

yield data

154

yield data

145

chunks -= 1

155

chunks -= 1

146

156

147

157

148

def _is_request_chunked(environ):

158

def _is_request_chunked(environ):

149

stream = environ.get('HTTP_TRANSFER_ENCODING', '') == 'chunked'

159

stream = environ.get('HTTP_TRANSFER_ENCODING', '') == 'chunked'

150

return stream

160

return stream

151

161

152

162

153

def _maybe_stream_request(environ):

163

def _maybe_stream_request(environ):

154

path = environ['PATH_INFO']

164

path = environ['PATH_INFO']

155

stream = _is_request_chunked(environ)

165

stream = _is_request_chunked(environ)

156

log.debug('handling request `%s` with stream support: %s', path, stream)

166

log.debug('handling request `%s` with stream support: %s', path, stream)

157

167

158

if stream:

168

if stream:

159

# set stream by 256k

169

# set stream by 256k

160

return read_in_chunks(environ['wsgi.input'], block_size=1024 * 256)

170

return read_in_chunks(environ['wsgi.input'], block_size=1024 * 256)

161

else:

171

else:

162

return environ['wsgi.input'].read()

172

return environ['wsgi.input'].read()

163

173

164

174

165

def _maybe_stream_response(response):

175

def _maybe_stream_response(response):

166

"""

176

"""

167

Try to generate chunks from the response if it is chunked.

177

Try to generate chunks from the response if it is chunked.

168

"""

178

"""

169

stream = _is_chunked(response)

179

stream = _is_chunked(response)

170

log.debug('returning response with stream: %s', stream)

180

log.debug('returning response with stream: %s', stream)

171

if stream:

181

if stream:

172

# read in 256k Chunks

182

# read in 256k Chunks

173

return response.raw.read_chunked(amt=1024 * 256)

183

return response.raw.read_chunked(amt=1024 * 256)

174

else:

184

else:

175

return [response.content]

185

return [response.content]

176

186

177

187

178

def _is_chunked(response):

188

def _is_chunked(response):

179

return response.headers.get('Transfer-Encoding', '') == 'chunked'

189

return response.headers.get('Transfer-Encoding', '') == 'chunked'

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # -*- coding: utf-8 -*-
             # Copyright (C) 2014-2020 RhodeCode GmbH
             #
             # This program is free software: you can redistribute it and/or modify
             # it under the terms of the GNU Affero General Public License, version 3
             # (only), as published by the Free Software Foundation.
             #
             # This program is distributed in the hope that it will be useful,
             # but WITHOUT ANY WARRANTY; without even the implied warranty of
             # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
             # GNU General Public License for more details.
             #
             # You should have received a copy of the GNU Affero General Public License
             # along with this program.  If not, see <http://www.gnu.org/licenses/>.
             #
             # This program is dual-licensed. If you wish to learn more about the
             # RhodeCode Enterprise Edition, including its added features, Support services,
             # and proprietary license terms, please see https://rhodecode.com/licenses/
             """
             Implementation of the scm_app interface using raw HTTP communication.
             """
             import base64
             import logging
             import urlparse
             import wsgiref.util
             import msgpack
             import requests
             import webob.request
             import rhodecode
             log = logging.getLogger(__name__)
             def create_git_wsgi_app(repo_path, repo_name, config):
                 """
                 Build the WSGI proxy application for a Git repository.

                 :param repo_path: Handed unchanged to :class:`VcsHttpProxy`.
                 :param repo_name: Handed unchanged to :class:`VcsHttpProxy`.
                 :param config: Handed unchanged to :class:`VcsHttpProxy`.
                 :return: A :class:`VcsHttpProxy` whose URL is the streaming URL
                     followed by ``git/``.
                 """
                 git_endpoint = ''.join((_vcs_streaming_url(), 'git/'))
                 return VcsHttpProxy(
                     url=git_endpoint,
                     repo_path=repo_path,
                     repo_name=repo_name,
                     config=config)
             def create_hg_wsgi_app(repo_path, repo_name, config):
                 """
                 Build the WSGI proxy application for a Mercurial repository.

                 :param repo_path: Handed unchanged to :class:`VcsHttpProxy`.
                 :param repo_name: Handed unchanged to :class:`VcsHttpProxy`.
                 :param config: Handed unchanged to :class:`VcsHttpProxy`.
                 :return: A :class:`VcsHttpProxy` whose URL is the streaming URL
                     followed by ``hg/``.
                 """
                 hg_endpoint = ''.join((_vcs_streaming_url(), 'hg/'))
                 return VcsHttpProxy(
                     url=hg_endpoint,
                     repo_path=repo_path,
                     repo_name=repo_name,
                     config=config)
             def _vcs_streaming_url():
                 """
                 Return the base streaming URL of the configured VCSServer.

                 The host part is taken from ``rhodecode.CONFIG['vcs.server']``; a
                 missing key raises ``KeyError``.
                 """
                 vcs_server = rhodecode.CONFIG['vcs.server']
                 return 'http://{}/stream/'.format(vcs_server)
             # TODO: johbo: Avoid the global.
             # Module-level HTTP session; VcsHttpProxy.__call__ sends every proxied
             # request through it.
             session = requests.Session()
             # Requests speedup, avoid reading .netrc and similar
             session.trust_env = False
             # Prevent urllib3 from spamming our logs: its connection pool logger is
             # raised to WARNING.
             logging.getLogger("requests.packages.urllib3.connectionpool").setLevel(
                 logging.WARNING)
             class VcsHttpProxy(object):
                 """
                 A WSGI application which proxies vcs requests.

                 The goal is to shuffle the data around without touching it. The only
                 exception is the extra data from the config object which we send to the
                 server as well.

                 Each call forwards the incoming request to the configured URL through
                 the module-level ``session`` and relays the status, headers and body
                 of the answer back to the WSGI caller.
                 """
                 def __init__(self, url, repo_path, repo_name, config):
                     """
                     :param str url: The URL of the VCSServer to call.
                     :param repo_path: Sent to the server as ``X-RC-Repo-Path``.
                     :param repo_name: Joined onto ``url`` and sent as
                         ``X-RC-Repo-Name``.
                     :param config: Packed with msgpack on every call and sent
                         base64-encoded as ``X-RC-Repo-Config``.
                     """
                     self._url = url
                     self._repo_name = repo_name
                     self._repo_path = repo_path
                     self._config = config
                     # Starts empty; __call__ reads the keys 'repo_store', 'config',
                     # 'username', 'user_id' and 'ip' from it. Presumably filled in by
                     # the caller before the app is invoked -- not visible in this file.
+                    self.rc_extras = {}
                     log.debug(
                         "Creating VcsHttpProxy for repo %s, url %s",
                         repo_name, url)
                 def __call__(self, environ, start_response):
                     """
                     Forward the WSGI request to the VCSServer and relay its answer.

                     :param dict environ: The WSGI environ of the incoming request.
                     :param start_response: The WSGI ``start_response`` callable.
                     :return: The iterable produced by ``_maybe_stream_response``.
                     """
                     config = msgpack.packb(self._config)
                     request = webob.request.Request(environ)
                     # Start from the headers of the incoming request and add the
                     # X-RC-* entries on top of them.
                     request_headers = request.headers
                     request_headers.update({
                         # TODO: johbo: Remove this, rely on URL path only
                         'X-RC-Repo-Name': self._repo_name,
                         'X-RC-Repo-Path': self._repo_path,
                         'X-RC-Path-Info': environ['PATH_INFO'],
                         # Values taken from rc_extras are None when the key is absent.
+                        'X-RC-Repo-Store': self.rc_extras.get('repo_store'),
+                        'X-RC-Server-Config-File': self.rc_extras.get('config'),
+                        'X-RC-Auth-User': self.rc_extras.get('username'),
+                        'X-RC-Auth-User-Id': self.rc_extras.get('user_id'),
+                        'X-RC-Auth-User-Ip': self.rc_extras.get('ip'),
                         # TODO: johbo: Avoid encoding and put this into payload?
                         'X-RC-Repo-Config': base64.b64encode(config),
-                        'X-RC-Locked-Status-Code': rhodecode.CONFIG.get('lock_ret_code')
+                        'X-RC-Locked-Status-Code': rhodecode.CONFIG.get('lock_ret_code'),
                     })
                     method = environ['REQUEST_METHOD']
                     # Preserve the query string
                     url = self._url
                     # The target is the repo name resolved against the base URL.
                     url = urlparse.urljoin(url, self._repo_name)
                     if environ.get('QUERY_STRING'):
                         url += '?' + environ['QUERY_STRING']
                     log.debug('http-app: preparing request to: %s', url)
                     # stream=True: the body is not fetched up front, so it can be
                     # handed on by _maybe_stream_response below.
                     response = session.request(
                         method,
                         url,
                         data=_maybe_stream_request(environ),
                         headers=request_headers,
                         stream=True)
                     log.debug('http-app: got vcsserver response: %s', response)
                     if response.status_code >= 500:
                         # NOTE(review): accessing response.content here reads the
                         # body for logging although the request was made with
                         # stream=True -- confirm this is fine for chunked error
                         # responses.
                         log.error('Exception returned by vcsserver at: %s %s, %s',
                                   url, response.status_code, response.content)
                     # Preserve the headers of the response, except hop_by_hop ones
                     response_headers = [
                         (h, v) for h, v in response.headers.items()
                         if not wsgiref.util.is_hop_by_hop(h)
                     ]
                     # Build status argument for start_response callable.
                     status = '{status_code} {reason_phrase}'.format(
                         status_code=response.status_code,
                         reason_phrase=response.reason)
                     start_response(status, response_headers)
                     return _maybe_stream_response(response)
             def read_in_chunks(stream_obj, block_size=1024, chunks=-1):
                 """
                 Yield successive blocks read from ``stream_obj``.

                 :param stream_obj: Object with a ``read(size)`` method.
                 :param int block_size: Size passed to each ``read`` call, 1k by default.
                 :param int chunks: Maximum number of blocks to yield. The default of
                     ``-1`` never counts down to zero, so reading only stops once
                     ``read`` returns an empty value.
                 """
                 remaining = chunks
                 while remaining:
                     block = stream_obj.read(block_size)
                     if block:
                         yield block
                         remaining -= 1
                     else:
                         # Empty read: the stream is exhausted.
                         return
             def _is_request_chunked(environ):
                 stream = environ.get('HTTP_TRANSFER_ENCODING', '') == 'chunked'
                 return stream
             def _maybe_stream_request(environ):
                 """
                 Return the request body, as a generator when the request is chunked.

                 :param dict environ: The WSGI environ of the request.
                 :return: A generator of 256k blocks read from ``wsgi.input`` for
                     chunked requests, otherwise the result of a single ``read()``.
                 """
                 request_path = environ['PATH_INFO']
                 use_streaming = _is_request_chunked(environ)
                 log.debug(
                     'handling request `%s` with stream support: %s',
                     request_path, use_streaming)

                 body = environ['wsgi.input']
                 if not use_streaming:
                     return body.read()
                 # stream the body in 256k blocks
                 return read_in_chunks(body, block_size=256 * 1024)
             def _maybe_stream_response(response):
                 """
                 Return an iterable over the response body.

                 :param response: The response object returned by ``session.request``.
                 :return: The result of ``response.raw.read_chunked`` with a 256k
                     amount when the response is chunked, otherwise a one-element
                     list holding ``response.content``.
                 """
                 chunked = _is_chunked(response)
                 log.debug('returning response with stream: %s', chunked)
                 if not chunked:
                     return [response.content]
                 # hand the body on in 256k chunks
                 return response.raw.read_chunked(amt=256 * 1024)
             def _is_chunked(response):
                 return response.headers.get('Transfer-Encoding', '') == 'chunked'