rhodecode-enterprise-ce Commit - r1529:3683d343

1

# -*- coding: utf-8 -*-

1

# -*- coding: utf-8 -*-

2

3

4

#

4

#

5

# This program is free software: you can redistribute it and/or modify

5

# This program is free software: you can redistribute it and/or modify

6

# it under the terms of the GNU Affero General Public License, version 3

6

# it under the terms of the GNU Affero General Public License, version 3

7

# (only), as published by the Free Software Foundation.

7

# (only), as published by the Free Software Foundation.

8

#

8

#

9

# This program is distributed in the hope that it will be useful,

9

# This program is distributed in the hope that it will be useful,

10

# but WITHOUT ANY WARRANTY; without even the implied warranty of

10

# but WITHOUT ANY WARRANTY; without even the implied warranty of

11

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

11

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

12

# GNU General Public License for more details.

12

# GNU General Public License for more details.

13

#

13

#

14

# You should have received a copy of the GNU Affero General Public License

14

# You should have received a copy of the GNU Affero General Public License

15

# along with this program. If not, see <http://www.gnu.org/licenses/>.

15

# along with this program. If not, see <http://www.gnu.org/licenses/>.

16

#

16

#

17

# This program is dual-licensed. If you wish to learn more about the

17

# This program is dual-licensed. If you wish to learn more about the

18

# RhodeCode Enterprise Edition, including its added features, Support services,

18

# RhodeCode Enterprise Edition, including its added features, Support services,

19

# and proprietary license terms, please see https://rhodecode.com/licenses/

19

# and proprietary license terms, please see https://rhodecode.com/licenses/

20

21

22

"""

22

"""

23

Renderer for markup languages with ability to parse using rst or markdown

23

Renderer for markup languages with ability to parse using rst or markdown

24

"""

24

"""

25

26

import re

26

import re

27

import os

27

import os

28

import lxml

28

import lxml

29

import logging

29

import logging

30

import urlparse

30

import urlparse

31

import urllib

32

31

33

from mako.lookup import TemplateLookup

32

from mako.lookup import TemplateLookup

34

from mako.template import Template as MakoTemplate

33

from mako.template import Template as MakoTemplate

35

34

36

from docutils.core import publish_parts

35

from docutils.core import publish_parts

37

from docutils.parsers.rst import directives

36

from docutils.parsers.rst import directives

38

import markdown

37

import markdown

39

38

40

from rhodecode.lib.markdown_ext import GithubFlavoredMarkdownExtension

39

from rhodecode.lib.markdown_ext import GithubFlavoredMarkdownExtension

41

from rhodecode.lib.utils2 import (

40

from rhodecode.lib.utils2 import (

42

safe_str, safe_unicode, md5_safe, MENTIONS_REGEX)

41

safe_str, safe_unicode, md5_safe, MENTIONS_REGEX)

43

42

44

log = logging.getLogger(__name__)

43

log = logging.getLogger(__name__)

45

44

46

# default renderer used to generate automated comments

45

# default renderer used to generate automated comments

47

DEFAULT_COMMENTS_RENDERER = 'rst'

46

DEFAULT_COMMENTS_RENDERER = 'rst'

48

47

49

48

50

def relative_links(html_source, server_path):

49

def relative_links(html_source, server_path):

51

doc = lxml.html.fromstring(html_source)

50

if not html_source:

51

return html_source

52

53

try:

54

doc = lxml.html.fromstring(html_source)

55

except Exception:

56

return html_source

57

52

for el in doc.cssselect('img, video'):

58

for el in doc.cssselect('img, video'):

53

src = el.attrib['src']

59

src = el.attrib['src']

54

if src:

60

if src:

55

el.attrib['src'] = relative_path(src, server_path)

61

el.attrib['src'] = relative_path(src, server_path)

56

62

57

for el in doc.cssselect('a:not(.gfm)'):

63

for el in doc.cssselect('a:not(.gfm)'):

58

src = el.attrib['href']

64

src = el.attrib['href']

59

if src:

65

if src:

60

el.attrib['href'] = relative_path(src, server_path)

66

el.attrib['href'] = relative_path(src, server_path)

61

67

62

return lxml.html.tostring(doc)

68

return lxml.html.tostring(doc)

63

69

64

70

65

def relative_path(path, request_path, is_repo_file=None):

71

def relative_path(path, request_path, is_repo_file=None):

66

"""

72

"""

67

relative link support, path is a rel path, and request_path is current

73

relative link support, path is a rel path, and request_path is current

68

server path (not absolute)

74

server path (not absolute)

69

75

70

e.g.

76

e.g.

71

77

72

path = '../logo.png'

78

path = '../logo.png'

73

request_path= '/repo/files/path/file.md'

79

request_path= '/repo/files/path/file.md'

74

produces: '/repo/files/logo.png'

80

produces: '/repo/files/logo.png'

75

"""

81

"""

76

# TODO(marcink): unicode/str support ?

82

# TODO(marcink): unicode/str support ?

77

# maybe=> safe_unicode(urllib.quote(safe_str(final_path), '/:'))

83

# maybe=> safe_unicode(urllib.quote(safe_str(final_path), '/:'))

78

84

79

def dummy_check(p):

85

def dummy_check(p):

80

return True # assume default is a valid file path

86

return True # assume default is a valid file path

81

87

82

is_repo_file = is_repo_file or dummy_check

88

is_repo_file = is_repo_file or dummy_check

83

if not path:

89

if not path:

84

return request_path

90

return request_path

85

91

86

path = safe_unicode(path)

92

path = safe_unicode(path)

87

request_path = safe_unicode(request_path)

93

request_path = safe_unicode(request_path)

88

94

89

if path.startswith((u'data:', u'#', u':')):

95

if path.startswith((u'data:', u'javascript:', u'#', u':')):

90

# skip data, anchor, invalid links

96

# skip data, anchor, invalid links

91

return path

97

return path

92

98

93

is_absolute = bool(urlparse.urlparse(path).netloc)

99

is_absolute = bool(urlparse.urlparse(path).netloc)

94

if is_absolute:

100

if is_absolute:

95

return path

101

return path

96

102

97

if not request_path:

103

if not request_path:

98

return path

104

return path

99

105

100

if path.startswith(u'/'):

106

if path.startswith(u'/'):

101

path = path[1:]

107

path = path[1:]

102

108

103

if path.startswith(u'./'):

109

if path.startswith(u'./'):

104

path = path[2:]

110

path = path[2:]

105

111

106

parts = request_path.split('/')

112

parts = request_path.split('/')

107

# compute how deep we need to traverse the request_path

113

# compute how deep we need to traverse the request_path

108

depth = 0

114

depth = 0

109

115

110

if is_repo_file(request_path):

116

if is_repo_file(request_path):

111

# if request path is a VALID file, we use a relative path with

117

# if request path is a VALID file, we use a relative path with

112

# one level up

118

# one level up

113

depth += 1

119

depth += 1

114

120

115

while path.startswith(u'../'):

121

while path.startswith(u'../'):

116

depth += 1

122

depth += 1

117

path = path[3:]

123

path = path[3:]

118

124

119

if depth > 0:

125

if depth > 0:

120

parts = parts[:-depth]

126

parts = parts[:-depth]

121

127

122

parts.append(path)

128

parts.append(path)

123

final_path = u'/'.join(parts).lstrip(u'/')

129

final_path = u'/'.join(parts).lstrip(u'/')

124

130

125

return u'/' + final_path

131

return u'/' + final_path

126

132

127

133

128

class MarkupRenderer(object):

134

class MarkupRenderer(object):

129

RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']

135

RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']

130

136

131

MARKDOWN_PAT = re.compile(r'\.(md|mkdn?|mdown|markdown)$', re.IGNORECASE)

137

MARKDOWN_PAT = re.compile(r'\.(md|mkdn?|mdown|markdown)$', re.IGNORECASE)

132

RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)

138

RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)

133

JUPYTER_PAT = re.compile(r'\.(ipynb)$', re.IGNORECASE)

139

JUPYTER_PAT = re.compile(r'\.(ipynb)$', re.IGNORECASE)

134

PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)

140

PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)

135

141

136

extensions = ['codehilite', 'extra', 'def_list', 'sane_lists']

142

extensions = ['codehilite', 'extra', 'def_list', 'sane_lists']

137

markdown_renderer = markdown.Markdown(

143

markdown_renderer = markdown.Markdown(

138

extensions, safe_mode=True, enable_attributes=False)

144

extensions, safe_mode=True, enable_attributes=False)

139

145

140

markdown_renderer_flavored = markdown.Markdown(

146

markdown_renderer_flavored = markdown.Markdown(

141

extensions + [GithubFlavoredMarkdownExtension()], safe_mode=True,

147

extensions + [GithubFlavoredMarkdownExtension()], safe_mode=True,

142

enable_attributes=False)

148

enable_attributes=False)

143

149

144

# extension together with weights. Lower is first means we control how

150

# extension together with weights. Lower is first means we control how

145

# extensions are attached to readme names with those.

151

# extensions are attached to readme names with those.

146

PLAIN_EXTS = [

152

PLAIN_EXTS = [

147

# prefer no extension

153

# prefer no extension

148

('', 0), # special case that renders READMES names without extension

154

('', 0), # special case that renders READMES names without extension

149

('.text', 2), ('.TEXT', 2),

155

('.text', 2), ('.TEXT', 2),

150

('.txt', 3), ('.TXT', 3)

156

('.txt', 3), ('.TXT', 3)

151

]

157

]

152

158

153

RST_EXTS = [

159

RST_EXTS = [

154

('.rst', 1), ('.rest', 1),

160

('.rst', 1), ('.rest', 1),

155

('.RST', 2), ('.REST', 2)

161

('.RST', 2), ('.REST', 2)

156

]

162

]

157

163

158

MARKDOWN_EXTS = [

164

MARKDOWN_EXTS = [

159

('.md', 1), ('.MD', 1),

165

('.md', 1), ('.MD', 1),

160

('.mkdn', 2), ('.MKDN', 2),

166

('.mkdn', 2), ('.MKDN', 2),

161

('.mdown', 3), ('.MDOWN', 3),

167

('.mdown', 3), ('.MDOWN', 3),

162

('.markdown', 4), ('.MARKDOWN', 4)

168

('.markdown', 4), ('.MARKDOWN', 4)

163

]

169

]

164

170

165

def _detect_renderer(self, source, filename=None):

171

def _detect_renderer(self, source, filename=None):

166

"""

172

"""

167

runs detection of what renderer should be used for generating html

173

runs detection of what renderer should be used for generating html

168

from a markup language

174

from a markup language

169

175

170

filename can be also explicitly a renderer name

176

filename can be also explicitly a renderer name

171

177

172

:param source:

178

:param source:

173

:param filename:

179

:param filename:

174

"""

180

"""

175

181

176

if MarkupRenderer.MARKDOWN_PAT.findall(filename):

182

if MarkupRenderer.MARKDOWN_PAT.findall(filename):

177

detected_renderer = 'markdown'

183

detected_renderer = 'markdown'

178

elif MarkupRenderer.RST_PAT.findall(filename):

184

elif MarkupRenderer.RST_PAT.findall(filename):

179

detected_renderer = 'rst'

185

detected_renderer = 'rst'

180

elif MarkupRenderer.JUPYTER_PAT.findall(filename):

186

elif MarkupRenderer.JUPYTER_PAT.findall(filename):

181

detected_renderer = 'jupyter'

187

detected_renderer = 'jupyter'

182

elif MarkupRenderer.PLAIN_PAT.findall(filename):

188

elif MarkupRenderer.PLAIN_PAT.findall(filename):

183

detected_renderer = 'plain'

189

detected_renderer = 'plain'

184

else:

190

else:

185

detected_renderer = 'plain'

191

detected_renderer = 'plain'

186

192

187

return getattr(MarkupRenderer, detected_renderer)

193

return getattr(MarkupRenderer, detected_renderer)

188

194

189

@classmethod

195

@classmethod

190

def renderer_from_filename(cls, filename, exclude):

196

def renderer_from_filename(cls, filename, exclude):

191

"""

197

"""

192

Detect renderer markdown/rst from filename and optionally use exclude

198

Detect renderer markdown/rst from filename and optionally use exclude

193

list to remove some options. This is mostly used in helpers.

199

list to remove some options. This is mostly used in helpers.

194

Returns None when no renderer can be detected.

200

Returns None when no renderer can be detected.

195

"""

201

"""

196

def _filter(elements):

202

def _filter(elements):

197

if isinstance(exclude, (list, tuple)):

203

if isinstance(exclude, (list, tuple)):

198

return [x for x in elements if x not in exclude]

204

return [x for x in elements if x not in exclude]

199

return elements

205

return elements

200

206

201

if filename.endswith(

207

if filename.endswith(

202

tuple(_filter([x[0] for x in cls.MARKDOWN_EXTS if x[0]]))):

208

tuple(_filter([x[0] for x in cls.MARKDOWN_EXTS if x[0]]))):

203

return 'markdown'

209

return 'markdown'

204

if filename.endswith(tuple(_filter([x[0] for x in cls.RST_EXTS if x[0]]))):

210

if filename.endswith(tuple(_filter([x[0] for x in cls.RST_EXTS if x[0]]))):

205

return 'rst'

211

return 'rst'

206

212

207

return None

213

return None

208

214

209

def render(self, source, filename=None):

215

def render(self, source, filename=None):

210

"""

216

"""

211

Renders a given filename using detected renderer

217

Renders a given filename using detected renderer

212

it detects renderers based on file extension or mimetype.

218

it detects renderers based on file extension or mimetype.

213

At last it will just do a simple html replacing new lines with <br/>

219

At last it will just do a simple html replacing new lines with <br/>

214

220

215

:param file_name:

221

:param file_name:

216

:param source:

222

:param source:

217

"""

223

"""

218

224

219

renderer = self._detect_renderer(source, filename)

225

renderer = self._detect_renderer(source, filename)

220

readme_data = renderer(source)

226

readme_data = renderer(source)

221

return readme_data

227

return readme_data

222

228

223

@classmethod

229

@classmethod

224

def _flavored_markdown(cls, text):

230

def _flavored_markdown(cls, text):

225

"""

231

"""

226

Github style flavored markdown

232

Github style flavored markdown

227

233

228

:param text:

234

:param text:

229

"""

235

"""

230

236

231

# Extract pre blocks.

237

# Extract pre blocks.

232

extractions = {}

238

extractions = {}

233

239

234

def pre_extraction_callback(matchobj):

240

def pre_extraction_callback(matchobj):

235

digest = md5_safe(matchobj.group(0))

241

digest = md5_safe(matchobj.group(0))

236

extractions[digest] = matchobj.group(0)

242

extractions[digest] = matchobj.group(0)

237

return "{gfm-extraction-%s}" % digest

243

return "{gfm-extraction-%s}" % digest

238

pattern = re.compile(r'<pre>.*?</pre>', re.MULTILINE | re.DOTALL)

244

pattern = re.compile(r'<pre>.*?</pre>', re.MULTILINE | re.DOTALL)

239

text = re.sub(pattern, pre_extraction_callback, text)

245

text = re.sub(pattern, pre_extraction_callback, text)

240

246

241

# Prevent foo_bar_baz from ending up with an italic word in the middle.

247

# Prevent foo_bar_baz from ending up with an italic word in the middle.

242

def italic_callback(matchobj):

248

def italic_callback(matchobj):

243

s = matchobj.group(0)

249

s = matchobj.group(0)

244

if list(s).count('_') >= 2:

250

if list(s).count('_') >= 2:

245

return s.replace('_', r'\_')

251

return s.replace('_', r'\_')

246

return s

252

return s

247

text = re.sub(r'^(?! {4}|\t)\w+_\w+_\w[\w_]*', italic_callback, text)

253

text = re.sub(r'^(?! {4}|\t)\w+_\w+_\w[\w_]*', italic_callback, text)

248

254

249

# Insert pre block extractions.

255

# Insert pre block extractions.

250

def pre_insert_callback(matchobj):

256

def pre_insert_callback(matchobj):

251

return '\n\n' + extractions[matchobj.group(1)]

257

return '\n\n' + extractions[matchobj.group(1)]

252

text = re.sub(r'\{gfm-extraction-([0-9a-f]{32})\}',

258

text = re.sub(r'\{gfm-extraction-([0-9a-f]{32})\}',

253

pre_insert_callback, text)

259

pre_insert_callback, text)

254

260

255

return text

261

return text

256

262

257

@classmethod

263

@classmethod

258

def urlify_text(cls, text):

264

def urlify_text(cls, text):

259

url_pat = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]'

265

url_pat = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]'

260

r'|[!*,]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')

266

r'|[!*,]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')

261

267

262

def url_func(match_obj):

268

def url_func(match_obj):

263

url_full = match_obj.groups()[0]

269

url_full = match_obj.groups()[0]

264

return '<a href="%(url)s">%(url)s</a>' % ({'url': url_full})

270

return '<a href="%(url)s">%(url)s</a>' % ({'url': url_full})

265

271

266

return url_pat.sub(url_func, text)

272

return url_pat.sub(url_func, text)

267

273

268

@classmethod

274

@classmethod

269

def plain(cls, source, universal_newline=True):

275

def plain(cls, source, universal_newline=True):

270

source = safe_unicode(source)

276

source = safe_unicode(source)

271

if universal_newline:

277

if universal_newline:

272

newline = '\n'

278

newline = '\n'

273

source = newline.join(source.splitlines())

279

source = newline.join(source.splitlines())

274

280

275

source = cls.urlify_text(source)

281

source = cls.urlify_text(source)

276

return '<br />' + source.replace("\n", '<br />')

282

return '<br />' + source.replace("\n", '<br />')

277

283

278

@classmethod

284

@classmethod

279

def markdown(cls, source, safe=True, flavored=True, mentions=False):

285

def markdown(cls, source, safe=True, flavored=True, mentions=False):

280

# It does not allow to insert inline HTML. In presence of HTML tags, it

286

# It does not allow to insert inline HTML. In presence of HTML tags, it

281

# will replace them instead with [HTML_REMOVED]. This is controlled by

287

# will replace them instead with [HTML_REMOVED]. This is controlled by

282

# the safe_mode=True parameter of the markdown method.

288

# the safe_mode=True parameter of the markdown method.

283

289

284

if flavored:

290

if flavored:

285

markdown_renderer = cls.markdown_renderer_flavored

291

markdown_renderer = cls.markdown_renderer_flavored

286

else:

292

else:

287

markdown_renderer = cls.markdown_renderer

293

markdown_renderer = cls.markdown_renderer

288

294

289

if mentions:

295

if mentions:

290

mention_pat = re.compile(MENTIONS_REGEX)

296

mention_pat = re.compile(MENTIONS_REGEX)

291

297

292

def wrapp(match_obj):

298

def wrapp(match_obj):

293

uname = match_obj.groups()[0]

299

uname = match_obj.groups()[0]

294

return ' **@%(uname)s** ' % {'uname': uname}

300

return ' **@%(uname)s** ' % {'uname': uname}

295

mention_hl = mention_pat.sub(wrapp, source).strip()

301

mention_hl = mention_pat.sub(wrapp, source).strip()

296

# we extracted mentions render with this using Mentions false

302

# we extracted mentions render with this using Mentions false

297

return cls.markdown(mention_hl, safe=safe, flavored=flavored,

303

return cls.markdown(mention_hl, safe=safe, flavored=flavored,

298

mentions=False)

304

mentions=False)

299

305

300

source = safe_unicode(source)

306

source = safe_unicode(source)

301

try:

307

try:

302

if flavored:

308

if flavored:

303

source = cls._flavored_markdown(source)

309

source = cls._flavored_markdown(source)

304

return markdown_renderer.convert(source)

310

return markdown_renderer.convert(source)

305

except Exception:

311

except Exception:

306

log.exception('Error when rendering Markdown')

312

log.exception('Error when rendering Markdown')

307

if safe:

313

if safe:

308

log.debug('Fallback to render in plain mode')

314

log.debug('Fallback to render in plain mode')

309

return cls.plain(source)

315

return cls.plain(source)

310

else:

316

else:

311

raise

317

raise

312

318

313

@classmethod

319

@classmethod

314

def rst(cls, source, safe=True, mentions=False):

320

def rst(cls, source, safe=True, mentions=False):

315

if mentions:

321

if mentions:

316

mention_pat = re.compile(MENTIONS_REGEX)

322

mention_pat = re.compile(MENTIONS_REGEX)

317

323

318

def wrapp(match_obj):

324

def wrapp(match_obj):

319

uname = match_obj.groups()[0]

325

uname = match_obj.groups()[0]

320

return ' **@%(uname)s** ' % {'uname': uname}

326

return ' **@%(uname)s** ' % {'uname': uname}

321

mention_hl = mention_pat.sub(wrapp, source).strip()

327

mention_hl = mention_pat.sub(wrapp, source).strip()

322

# we extracted mentions render with this using Mentions false

328

# we extracted mentions render with this using Mentions false

323

return cls.rst(mention_hl, safe=safe, mentions=False)

329

return cls.rst(mention_hl, safe=safe, mentions=False)

324

330

325

source = safe_unicode(source)

331

source = safe_unicode(source)

326

try:

332

try:

327

docutils_settings = dict(

333

docutils_settings = dict(

328

[(alias, None) for alias in

334

[(alias, None) for alias in

329

cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES])

335

cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES])

330

336

331

docutils_settings.update({'input_encoding': 'unicode',

337

docutils_settings.update({'input_encoding': 'unicode',

332

'report_level': 4})

338

'report_level': 4})

333

339

334

for k, v in docutils_settings.iteritems():

340

for k, v in docutils_settings.iteritems():

335

directives.register_directive(k, v)

341

directives.register_directive(k, v)

336

342

337

parts = publish_parts(source=source,

343

parts = publish_parts(source=source,

338

writer_name="html4css1",

344

writer_name="html4css1",

339

settings_overrides=docutils_settings)

345

settings_overrides=docutils_settings)

340

346

341

return parts['html_title'] + parts["fragment"]

347

return parts['html_title'] + parts["fragment"]

342

except Exception:

348

except Exception:

343

log.exception('Error when rendering RST')

349

log.exception('Error when rendering RST')

344

if safe:

350

if safe:

345

log.debug('Fallbacking to render in plain mode')

351

log.debug('Fallbacking to render in plain mode')

346

return cls.plain(source)

352

return cls.plain(source)

347

else:

353

else:

348

raise

354

raise

349

355

350

@classmethod

356

@classmethod

351

def jupyter(cls, source, safe=True):

357

def jupyter(cls, source, safe=True):

352

from rhodecode.lib import helpers

358

from rhodecode.lib import helpers

353

359

354

from traitlets.config import Config

360

from traitlets.config import Config

355

import nbformat

361

import nbformat

356

from nbconvert import HTMLExporter

362

from nbconvert import HTMLExporter

357

from nbconvert.preprocessors import Preprocessor

363

from nbconvert.preprocessors import Preprocessor

358

364

359

class CustomHTMLExporter(HTMLExporter):

365

class CustomHTMLExporter(HTMLExporter):

360

def _template_file_default(self):

366

def _template_file_default(self):

361

return 'basic'

367

return 'basic'

362

368

363

class Sandbox(Preprocessor):

369

class Sandbox(Preprocessor):

364

370

365

def preprocess(self, nb, resources):

371

def preprocess(self, nb, resources):

366

sandbox_text = 'SandBoxed(IPython.core.display.Javascript object)'

372

sandbox_text = 'SandBoxed(IPython.core.display.Javascript object)'

367

for cell in nb['cells']:

373

for cell in nb['cells']:

368

if safe and 'outputs' in cell:

374

if safe and 'outputs' in cell:

369

for cell_output in cell['outputs']:

375

for cell_output in cell['outputs']:

370

if 'data' in cell_output:

376

if 'data' in cell_output:

371

if 'application/javascript' in cell_output['data']:

377

if 'application/javascript' in cell_output['data']:

372

cell_output['data']['text/plain'] = sandbox_text

378

cell_output['data']['text/plain'] = sandbox_text

373

cell_output['data'].pop('application/javascript', None)

379

cell_output['data'].pop('application/javascript', None)

374

return nb, resources

380

return nb, resources

375

381

376

def _sanitize_resources(resources):

382

def _sanitize_resources(resources):

377

"""

383

"""

378

Skip/sanitize some of the CSS generated and included in jupyter

384

Skip/sanitize some of the CSS generated and included in jupyter

379

so it doesn't messes up UI so much

385

so it doesn't messes up UI so much

380

"""

386

"""

381

387

382

# TODO(marcink): probably we should replace this with whole custom

388

# TODO(marcink): probably we should replace this with whole custom

383

# CSS set that doesn't screw up, but jupyter generated html has some

389

# CSS set that doesn't screw up, but jupyter generated html has some

384

# special markers, so it requires Custom HTML exporter template with

390

# special markers, so it requires Custom HTML exporter template with

385

# _default_template_path_default, to achieve that

391

# _default_template_path_default, to achieve that

386

392

387

# strip the reset CSS

393

# strip the reset CSS

388

resources[0] = resources[0][resources[0].find('/*! Source'):]

394

resources[0] = resources[0][resources[0].find('/*! Source'):]

389

return resources

395

return resources

390

396

391

def as_html(notebook):

397

def as_html(notebook):

392

conf = Config()

398

conf = Config()

393

conf.CustomHTMLExporter.preprocessors = [Sandbox]

399

conf.CustomHTMLExporter.preprocessors = [Sandbox]

394

html_exporter = CustomHTMLExporter(config=conf)

400

html_exporter = CustomHTMLExporter(config=conf)

395

401

396

(body, resources) = html_exporter.from_notebook_node(notebook)

402

(body, resources) = html_exporter.from_notebook_node(notebook)

397

header = ''

403

header = ''

398

js = MakoTemplate(r'''

404

js = MakoTemplate(r'''

399

405

400

406

401

407

402

MathJax.Hub.Config({

408

MathJax.Hub.Config({

403

jax: ["input/TeX","output/HTML-CSS", "output/PreviewHTML"],

409

jax: ["input/TeX","output/HTML-CSS", "output/PreviewHTML"],

404

extensions: ["tex2jax.js","MathMenu.js","MathZoom.js", "fast-preview.js", "AssistiveMML.js", "[Contrib]/a11y/accessibility-menu.js"],

410

extensions: ["tex2jax.js","MathMenu.js","MathZoom.js", "fast-preview.js", "AssistiveMML.js", "[Contrib]/a11y/accessibility-menu.js"],

405

TeX: {

411

TeX: {

406

extensions: ["AMSmath.js","AMSsymbols.js","noErrors.js","noUndefined.js"]

412

extensions: ["AMSmath.js","AMSsymbols.js","noErrors.js","noUndefined.js"]

407

},

413

},

408

tex2jax: {

414

tex2jax: {

409

inlineMath: [ ['$','$'], ["\$","\$"] ],

415

inlineMath: [ ['$','$'], ["\$","\$"] ],

410

displayMath: [ ['$$','$$'], ["\\[","\\]"] ],

416

displayMath: [ ['$$','$$'], ["\\[","\\]"] ],

411

processEscapes: true,

417

processEscapes: true,

412

processEnvironments: true

418

processEnvironments: true

413

},

419

},

414

// Center justify equations in code and markdown cells. Elsewhere

420

// Center justify equations in code and markdown cells. Elsewhere

415

// we use CSS to left justify single line equations in code cells.

421

// we use CSS to left justify single line equations in code cells.

416

displayAlign: 'center',

422

displayAlign: 'center',

417

"HTML-CSS": {

423

"HTML-CSS": {

418

styles: {'.MathJax_Display': {"margin": 0}},

424

styles: {'.MathJax_Display': {"margin": 0}},

419

linebreaks: { automatic: true },

425

linebreaks: { automatic: true },

420

availableFonts: ["STIX", "TeX"]

426

availableFonts: ["STIX", "TeX"]

421

},

427

},

422

showMathMenu: false

428

showMathMenu: false

423

});

429

});

424

</script>

430

</script>

425

431

426

432

427

''').render(h=helpers)

433

''').render(h=helpers)

428

434

429

css = '<style>{}</style>'.format(

435

css = '<style>{}</style>'.format(

430

''.join(_sanitize_resources(resources['inlining']['css'])))

436

''.join(_sanitize_resources(resources['inlining']['css'])))

431

437

432

body = '\n'.join([header, css, js, body])

438

body = '\n'.join([header, css, js, body])

433

return body, resources

439

return body, resources

434

440

435

notebook = nbformat.reads(source, as_version=4)

441

notebook = nbformat.reads(source, as_version=4)

436

(body, resources) = as_html(notebook)

442

(body, resources) = as_html(notebook)

437

return body

443

return body

438

444

439

445

440

class RstTemplateRenderer(object):

446

class RstTemplateRenderer(object):

441

447

442

def __init__(self):

448

def __init__(self):

443

base = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))

449

base = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))

444

rst_template_dirs = [os.path.join(base, 'templates', 'rst_templates')]

450

rst_template_dirs = [os.path.join(base, 'templates', 'rst_templates')]

445

self.template_store = TemplateLookup(

451

self.template_store = TemplateLookup(

446

directories=rst_template_dirs,

452

directories=rst_template_dirs,

447

input_encoding='utf-8',

453

input_encoding='utf-8',

448

imports=['from rhodecode.lib import helpers as h'])

454

imports=['from rhodecode.lib import helpers as h'])

449

455

450

def _get_template(self, templatename):

456

def _get_template(self, templatename):

451

return self.template_store.get_template(templatename)

457

return self.template_store.get_template(templatename)

452

458

453

def render(self, template_name, **kwargs):

459

def render(self, template_name, **kwargs):

454

template = self._get_template(template_name)

460

template = self._get_template(template_name)

455

return template.render(**kwargs)

461

return template.render(**kwargs)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # -*- coding: utf-8 -*-
             # Copyright (C) 2011-2017 RhodeCode GmbH
             #
             # This program is free software: you can redistribute it and/or modify
             # it under the terms of the GNU Affero General Public License, version 3
             # (only), as published by the Free Software Foundation.
             #
             # This program is distributed in the hope that it will be useful,
             # but WITHOUT ANY WARRANTY; without even the implied warranty of
             # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
             # GNU General Public License for more details.
             #
             # You should have received a copy of the GNU Affero General Public License
             # along with this program.  If not, see <http://www.gnu.org/licenses/>.
             #
             # This program is dual-licensed. If you wish to learn more about the
             # RhodeCode Enterprise Edition, including its added features, Support services,
             # and proprietary license terms, please see https://rhodecode.com/licenses/
             """
             Renderer for markup languages with ability to parse using rst or markdown
             """
             import re
             import os
             import lxml
             import logging
             import urlparse
-            import urllib
             from mako.lookup import TemplateLookup
             from mako.template import Template as MakoTemplate
             from docutils.core import publish_parts
             from docutils.parsers.rst import directives
             import markdown
             from rhodecode.lib.markdown_ext import GithubFlavoredMarkdownExtension
             from rhodecode.lib.utils2 import (
                 safe_str, safe_unicode, md5_safe, MENTIONS_REGEX)
             log = logging.getLogger(__name__)
             # default renderer used to generate automated comments
             DEFAULT_COMMENTS_RENDERER = 'rst'
             def relative_links(html_source, server_path):
                 """
                 Rewrite relative media and link targets inside an HTML fragment.

                 The ``src`` of every ``img``/``video`` element and the ``href`` of every
                 ``a`` element that does not carry the ``gfm`` class is passed through
                 :func:`relative_path` together with ``server_path``.

                 :param html_source: HTML markup to process
                 :param server_path: current server path the links are resolved against
                 :return: serialized HTML, or ``html_source`` unchanged when it is empty
                     or cannot be parsed
                 """
                 # a bare ``import lxml`` does not load the ``html`` submodule
                 import lxml.html

                 if not html_source:
                     return html_source

                 try:
                     doc = lxml.html.fromstring(html_source)
                 except Exception:
                     # best effort: markup that cannot be parsed is returned untouched
                     return html_source

                 # media elements are processed first, then links, as before
                 for selector, attr_name in (('img, video', 'src'),
                                             ('a:not(.gfm)', 'href')):
                     for el in doc.cssselect(selector):
                         # named anchors / source-less media do not have the attribute;
                         # indexing ``attrib`` directly would raise KeyError
                         target = el.attrib.get(attr_name)
                         if target:
                             el.attrib[attr_name] = relative_path(target, server_path)

                 return lxml.html.tostring(doc)
             def relative_path(path, request_path, is_repo_file=None):
                 """
                 relative link support, path is a rel path, and request_path is current
                 server path (not absolute)

                 e.g.

                 path = '../logo.png'
                 request_path= '/repo/files/path/file.md'
                 produces: '/repo/files/logo.png'

                 :param path: link target found in the rendered document
                 :param request_path: server path of the document being rendered
                 :param is_repo_file: optional callable receiving ``request_path``; a
                     true result means the request path points at a file, so resolution
                     starts one level up. Defaults to a check that always returns True.
                 :return: ``request_path`` when ``path`` is empty, ``path`` itself for
                     skipped/absolute links or an empty ``request_path``, otherwise the
                     resolved path with a single leading ``/``
                 """
                 # TODO(marcink): unicode/str support ?
                 # maybe=> safe_unicode(urllib.quote(safe_str(final_path), '/:'))
                 def dummy_check(p):
                     return True  # assume default is a valid file path

                 is_repo_file = is_repo_file or dummy_check
                 if not path:
                     return request_path

                 path = safe_unicode(path)
                 request_path = safe_unicode(request_path)

                 # ``mailto:`` has no network location, so without this entry it would
                 # be treated as a relative file and glued onto the request path
                 if path.startswith(
                         (u'data:', u'javascript:', u'mailto:', u'#', u':')):
                     # skip data, script, mail, anchor, invalid links
                     return path

                 is_absolute = bool(urlparse.urlparse(path).netloc)
                 if is_absolute:
                     return path

                 if not request_path:
                     return path

                 if path.startswith(u'/'):
                     path = path[1:]

                 if path.startswith(u'./'):
                     path = path[2:]

                 parts = request_path.split('/')
                 # compute how deep we need to traverse the request_path
                 depth = 0

                 if is_repo_file(request_path):
                     # if request path is a VALID file, we use a relative path with
                     # one level up
                     depth += 1

                 # every leading '../' climbs one more level
                 while path.startswith(u'../'):
                     depth += 1
                     path = path[3:]

                 if depth > 0:
                     parts = parts[:-depth]

                 parts.append(path)
                 final_path = u'/'.join(parts).lstrip(u'/')

                 return u'/' + final_path
             class MarkupRenderer(object):
                 """
                 Renders markup sources (markdown, rst, jupyter notebooks, plain text)
                 into HTML, picking the renderer from the file name.
                 """
                 # directive names that ``rst()`` registers with a ``None`` implementation
                 RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']
                 # file-name patterns consulted by ``_detect_renderer()``
                 MARKDOWN_PAT = re.compile(r'\.(md|mkdn?|mdown|markdown)$', re.IGNORECASE)
                 RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)
                 JUPYTER_PAT = re.compile(r'\.(ipynb)$', re.IGNORECASE)
                 PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)
                 # markdown extensions shared by both renderer instances below
                 extensions = ['codehilite', 'extra', 'def_list', 'sane_lists']
                 # both renderers are created once, at class-definition time, and are
                 # shared by every call to ``markdown()``
                 markdown_renderer = markdown.Markdown(
                     extensions, safe_mode=True, enable_attributes=False)
                 markdown_renderer_flavored = markdown.Markdown(
                     extensions + [GithubFlavoredMarkdownExtension()], safe_mode=True,
                     enable_attributes=False)
                 # extension together with weights. Lower is first means we control how
                 # extensions are attached to readme names with those.
                 PLAIN_EXTS = [
                     # prefer no extension
                     ('', 0),  # special case that renders READMES names without extension
                     ('.text', 2), ('.TEXT', 2),
                     ('.txt', 3), ('.TXT', 3)
                 ]
                 RST_EXTS = [
                     ('.rst', 1), ('.rest', 1),
                     ('.RST', 2), ('.REST', 2)
                 ]
                 MARKDOWN_EXTS = [
                     ('.md', 1), ('.MD', 1),
                     ('.mkdn', 2), ('.MKDN', 2),
                     ('.mdown', 3), ('.MDOWN', 3),
                     ('.markdown', 4), ('.MARKDOWN', 4)
                 ]
                 def _detect_renderer(self, source, filename=None):
                     """
                     runs detection of what renderer should be used for generating html
                     from a markup language
                     filename can be also explicitly a renderer name
                     :param source:
                     :param filename:
                     """
                     if MarkupRenderer.MARKDOWN_PAT.findall(filename):
                         detected_renderer = 'markdown'
                     elif MarkupRenderer.RST_PAT.findall(filename):
                         detected_renderer = 'rst'
                     elif MarkupRenderer.JUPYTER_PAT.findall(filename):
                         detected_renderer = 'jupyter'
                     elif MarkupRenderer.PLAIN_PAT.findall(filename):
                         detected_renderer = 'plain'
                     else:
                         detected_renderer = 'plain'
                     return getattr(MarkupRenderer, detected_renderer)
                 @classmethod
                 def renderer_from_filename(cls, filename, exclude):
                     """
                     Detect renderer markdown/rst from filename and optionally use exclude
                     list to remove some options. This is mostly used in helpers.
                     Returns None when no renderer can be detected.
                     """
                     def _filter(elements):
                         if isinstance(exclude, (list, tuple)):
                             return [x for x in elements if x not in exclude]
                         return elements
                     if filename.endswith(
                             tuple(_filter([x[0] for x in cls.MARKDOWN_EXTS if x[0]]))):
                         return 'markdown'
                     if filename.endswith(tuple(_filter([x[0] for x in cls.RST_EXTS if x[0]]))):
                         return 'rst'
                     return None
                 def render(self, source, filename=None):
                     """
                     Renders a given filename using detected renderer
                     it detects renderers based on file extension or mimetype.
                     At last it will just do a simple html replacing new lines with <br/>
                     :param file_name:
                     :param source:
                     """
                     renderer = self._detect_renderer(source, filename)
                     readme_data = renderer(source)
                     return readme_data
                 @classmethod
                 def _flavored_markdown(cls, text):
                     """
                     Github style flavored markdown pre-processing.

                     ``<pre>`` blocks are swapped for digest placeholders, underscores
                     of a multi-underscore word at the start of the text are escaped,
                     and the ``<pre>`` blocks are put back preceded by a blank line.

                     :param text: markdown source
                     :return: pre-processed markdown source
                     """
                     # Extract pre blocks.
                     extractions = {}

                     def pre_extraction_callback(matchobj):
                         digest = md5_safe(matchobj.group(0))
                         extractions[digest] = matchobj.group(0)
                         return "{gfm-extraction-%s}" % digest

                     pattern = re.compile(r'<pre>.*?</pre>', re.MULTILINE | re.DOTALL)
                     text = re.sub(pattern, pre_extraction_callback, text)

                     # Prevent foo_bar_baz from ending up with an italic word in the middle.
                     def italic_callback(matchobj):
                         s = matchobj.group(0)
                         if s.count('_') >= 2:
                             return s.replace('_', r'\_')
                         return s

                     # NOTE: ``^`` is used without re.MULTILINE, so only a word at the
                     # very start of the text is considered
                     text = re.sub(r'^(?! {4}|\t)\w+_\w+_\w[\w_]*', italic_callback, text)

                     # Insert pre block extractions.
                     def pre_insert_callback(matchobj):
                         original = extractions.get(matchobj.group(1))
                         if original is None:
                             # placeholder-looking text typed by the author, not one
                             # of ours: keep it instead of failing with KeyError
                             return matchobj.group(0)
                         return '\n\n' + original

                     text = re.sub(r'\{gfm-extraction-([0-9a-f]{32})\}',
                                   pre_insert_callback, text)

                     return text
                 @classmethod
                 def urlify_text(cls, text):
                     url_pat = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]'
                                          r'|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')
                     def url_func(match_obj):
                         url_full = match_obj.groups()[0]
                         return '<a href="%(url)s">%(url)s</a>' % ({'url': url_full})
                     return url_pat.sub(url_func, text)
                 @classmethod
                 def plain(cls, source, universal_newline=True):
                     """
                     Render text as HTML by linking URLs and turning newlines into
                     ``<br />`` tags.

                     :param source: text to render
                     :param universal_newline: when true, every line ending recognised
                         by ``splitlines()`` is first normalised to ``\\n``
                     :return: HTML string, always starting with ``<br />``
                     """
                     text = safe_unicode(source)
                     if universal_newline:
                         text = '\n'.join(text.splitlines())

                     linked = cls.urlify_text(text)
                     return '<br />' + linked.replace("\n", '<br />')
                 @classmethod
                 def markdown(cls, source, safe=True, flavored=True, mentions=False):
                     """
                     Render markdown source to HTML.

                     :param source: markdown text
                     :param safe: when true, a rendering error falls back to
                         ``plain()``; when false the error is re-raised
                     :param flavored: use the Github flavored renderer and
                         pre-processing
                     :param mentions: wrap ``@user`` mentions in bold before rendering
                     :return: rendered HTML
                     """
                     # It does not allow to insert inline HTML. In presence of HTML tags, it
                     # will replace them instead with [HTML_REMOVED]. This is controlled by
                     # the safe_mode=True parameter of the markdown method.

                     if flavored:
                         markdown_renderer = cls.markdown_renderer_flavored
                     else:
                         markdown_renderer = cls.markdown_renderer

                     if mentions:
                         mention_pat = re.compile(MENTIONS_REGEX)

                         def wrapp(match_obj):
                             uname = match_obj.groups()[0]
                             return ' **@%(uname)s** ' % {'uname': uname}
                         mention_hl = mention_pat.sub(wrapp, source).strip()
                         # we extracted mentions render with this using Mentions false
                         return cls.markdown(mention_hl, safe=safe, flavored=flavored,
                                             mentions=False)

                     source = safe_unicode(source)
                     try:
                         if flavored:
                             source = cls._flavored_markdown(source)
                         # the renderer instances are shared class attributes; reset
                         # them so state kept by extensions for a previous document
                         # cannot leak into this one
                         markdown_renderer.reset()
                         return markdown_renderer.convert(source)
                     except Exception:
                         log.exception('Error when rendering Markdown')
                         if safe:
                             log.debug('Fallback to render in plain mode')
                             return cls.plain(source)
                         else:
                             raise
                 @classmethod
                 def rst(cls, source, safe=True, mentions=False):
                     """
                     Render reStructuredText source to HTML.

                     :param source: rst text
                     :param safe: when true, a rendering error falls back to
                         ``plain()``; when false the error is re-raised
                     :param mentions: wrap ``@user`` mentions in bold before rendering
                     :return: the ``html_title`` and ``fragment`` parts produced by
                         docutils, concatenated
                     """
                     if mentions:
                         mention_pat = re.compile(MENTIONS_REGEX)

                         def wrapp(match_obj):
                             uname = match_obj.groups()[0]
                             return ' **@%(uname)s** ' % {'uname': uname}
                         mention_hl = mention_pat.sub(wrapp, source).strip()
                         # we extracted mentions render with this using Mentions false
                         return cls.rst(mention_hl, safe=safe, mentions=False)

                     source = safe_unicode(source)
                     try:
                         # disable the disallowed directives by registering None under
                         # their names; only directive names are registered, settings
                         # keys are kept out of the directive registry
                         for directive_name in cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES:
                             directives.register_directive(directive_name, None)

                         docutils_settings = {
                             'input_encoding': 'unicode',
                             'report_level': 4,
                             # the source is user supplied: forbid reading files or
                             # URLs from the server and raw output passthrough
                             'file_insertion_enabled': False,
                             'raw_enabled': False,
                         }

                         parts = publish_parts(source=source,
                                               writer_name="html4css1",
                                               settings_overrides=docutils_settings)

                         return parts['html_title'] + parts["fragment"]
                     except Exception:
                         log.exception('Error when rendering RST')
                         if safe:
                             log.debug('Fallbacking to render in plain mode')
                             return cls.plain(source)
                         else:
                             raise
                 @classmethod
                 def jupyter(cls, source, safe=True):
                     """
                     Render a Jupyter notebook to HTML.

                     The notebook is read with ``nbformat`` (as version 4), exported
                     with nbconvert's ``HTMLExporter`` using the ``basic`` template and
                     prefixed with a marker comment, the inlined CSS and the MathJax
                     bootstrap script.

                     :param source: notebook source as accepted by ``nbformat.reads``
                     :param safe: when true, ``application/javascript`` cell outputs
                         are replaced with a placeholder text
                     :return: HTML body
                     """
                     from rhodecode.lib import helpers
                     from traitlets.config import Config
                     import nbformat
                     from nbconvert import HTMLExporter
                     from nbconvert.preprocessors import Preprocessor

                     class CustomHTMLExporter(HTMLExporter):
                         def _template_file_default(self):
                             return 'basic'

                     class Sandbox(Preprocessor):
                         def preprocess(self, nb, resources):
                             sandbox_text = 'SandBoxed(IPython.core.display.Javascript object)'
                             for cell in nb['cells']:
                                 if safe and 'outputs' in cell:
                                     for cell_output in cell['outputs']:
                                         if 'data' in cell_output:
                                             if 'application/javascript' in cell_output['data']:
                                                 # swap the script for a harmless text note
                                                 cell_output['data']['text/plain'] = sandbox_text
                                                 cell_output['data'].pop('application/javascript', None)
                             return nb, resources

                     def _sanitize_resources(resources):
                         """
                         Skip/sanitize some of the CSS generated and included in jupyter
                         so it doesn't messes up UI so much
                         """
                         # TODO(marcink): probably we should replace this with whole custom
                         # CSS set that doesn't screw up, but jupyter generated html has some
                         # special markers, so it requires Custom HTML exporter template with
                         # _default_template_path_default, to achieve that

                         # strip the reset CSS
                         if resources:
                             marker_pos = resources[0].find('/*! Source')
                             # find() returns -1 when the marker is missing; slicing from
                             # -1 would keep only the last character of the stylesheet
                             if marker_pos > 0:
                                 resources[0] = resources[0][marker_pos:]
                         return resources

                     def as_html(notebook):
                         conf = Config()
                         conf.CustomHTMLExporter.preprocessors = [Sandbox]
                         html_exporter = CustomHTMLExporter(config=conf)

                         (body, resources) = html_exporter.from_notebook_node(notebook)
                         header = '<!-- ## IPYTHON NOTEBOOK RENDERING ## -->'
                         js = MakoTemplate(r'''
                         <!-- Load mathjax -->
                             <!-- MathJax configuration -->
                             <script type="text/x-mathjax-config">
                             MathJax.Hub.Config({
                                 jax: ["input/TeX","output/HTML-CSS", "output/PreviewHTML"],
                                 extensions: ["tex2jax.js","MathMenu.js","MathZoom.js", "fast-preview.js", "AssistiveMML.js", "[Contrib]/a11y/accessibility-menu.js"],
                                 TeX: {
                                     extensions: ["AMSmath.js","AMSsymbols.js","noErrors.js","noUndefined.js"]
                                 },
                                 tex2jax: {
                                     inlineMath: [ ['$','$'], ["\\(","\\)"] ],
                                     displayMath: [ ['$$','$$'], ["\\[","\\]"] ],
                                     processEscapes: true,
                                     processEnvironments: true
                                 },
                                 // Center justify equations in code and markdown cells. Elsewhere
                                 // we use CSS to left justify single line equations in code cells.
                                 displayAlign: 'center',
                                 "HTML-CSS": {
                                     styles: {'.MathJax_Display': {"margin": 0}},
                                     linebreaks: { automatic: true },
                                     availableFonts: ["STIX", "TeX"]
                                 },
                                 showMathMenu: false
                             });
                             </script>
                             <!-- End of mathjax configuration -->
                             <script src="${h.asset('js/src/math_jax/MathJax.js')}"></script>
                         ''').render(h=helpers)

                         css = '<style>{}</style>'.format(
                             ''.join(_sanitize_resources(resources['inlining']['css'])))

                         body = '\n'.join([header, css, js, body])
                         return body, resources

                     notebook = nbformat.reads(source, as_version=4)
                     (body, resources) = as_html(notebook)
                     return body
             class RstTemplateRenderer(object):
                 """
                 Looks up and renders Mako templates stored in the
                 ``templates/rst_templates`` directory.
                 """

                 def __init__(self):
                     # the templates directory sits next to this module's parent package
                     module_dir = os.path.dirname(__file__)
                     base = os.path.abspath(os.path.dirname(module_dir))
                     template_dir = os.path.join(base, 'templates', 'rst_templates')
                     lookup_options = {
                         'directories': [template_dir],
                         'input_encoding': 'utf-8',
                         'imports': ['from rhodecode.lib import helpers as h'],
                     }
                     self.template_store = TemplateLookup(**lookup_options)

                 def _get_template(self, templatename):
                     """Fetch the template called ``templatename`` from the store."""
                     store = self.template_store
                     return store.get_template(templatename)

                 def render(self, template_name, **kwargs):
                     """
                     Render ``template_name``, passing ``kwargs`` as template variables.
                     """
                     return self._get_template(template_name).render(**kwargs)