##// END OF EJS Templates
safe_unicode never fails. No need to catch decode exceptions
safe_unicode never fails. No need to catch decode exceptions

File last commit:

r2278:24095abd beta
r2297:4747af4c beta
Show More
__init__.py
138 lines | 3.7 KiB | text/x-python | PythonLexer
Added VCS into rhodecode core for faster and easier deployments of new versions
r2007 """
This module provides some useful tools for ``vcs`` like annotate/diff html
output. It also includes some internal helpers.
"""
import sys
import time
import datetime
def makedate():
lt = time.localtime()
if lt[8] == 1 and time.daylight:
tz = time.altzone
else:
tz = time.timezone
return time.mktime(lt), tz
def date_fromtimestamp(unixts, tzoffset=0):
"""
Makes a local datetime object out of unix timestamp
:param unixts:
:param tzoffset:
"""
return datetime.datetime.fromtimestamp(float(unixts))
implements #212 moved default encoding variable into rhodecode-config. It's now possible to change...
r2016 def safe_unicode(str_, from_encoding=None):
Added VCS into rhodecode core for faster and easier deployments of new versions
r2007 """
safe unicode function. Does few trick to turn str_ into unicode
In case of UnicodeDecode error we try to return it with encoding detected
by chardet library if it fails fallback to unicode with errors replaced
:param str_: string to decode
:rtype: unicode
:returns: unicode object
"""
if isinstance(str_, unicode):
return str_
implements #212 moved default encoding variable into rhodecode-config. It's now possible to change...
r2016 if not from_encoding:
import rhodecode
more work on improving info logging
r2025 DEFAULT_ENCODING = rhodecode.CONFIG.get('default_encoding', 'utf8')
implements #212 moved default encoding variable into rhodecode-config. It's now possible to change...
r2016 from_encoding = DEFAULT_ENCODING
Added VCS into rhodecode core for faster and easier deployments of new versions
r2007 try:
return unicode(str_)
except UnicodeDecodeError:
pass
try:
return unicode(str_, from_encoding)
except UnicodeDecodeError:
pass
try:
import chardet
encoding = chardet.detect(str_)['encoding']
if encoding is None:
raise Exception()
return str_.decode(encoding)
except (ImportError, UnicodeDecodeError, Exception):
return unicode(str_, from_encoding, 'replace')
implements #212 moved default encoding variable into rhodecode-config. It's now possible to change...
r2016 def safe_str(unicode_, to_encoding=None):
Added VCS into rhodecode core for faster and easier deployments of new versions
r2007 """
safe str function. Does few trick to turn unicode_ into string
In case of UnicodeEncodeError we try to return it with encoding detected
by chardet library if it fails fallback to string with errors replaced
:param unicode_: unicode to encode
:rtype: str
:returns: str object
"""
if isinstance(unicode_, str):
return unicode_
implements #212 moved default encoding variable into rhodecode-config. It's now possible to change...
r2016 if not to_encoding:
import rhodecode
more work on improving info logging
r2025 DEFAULT_ENCODING = rhodecode.CONFIG.get('default_encoding', 'utf8')
implements #212 moved default encoding variable into rhodecode-config. It's now possible to change...
r2016 to_encoding = DEFAULT_ENCODING
Added VCS into rhodecode core for faster and easier deployments of new versions
r2007 try:
return unicode_.encode(to_encoding)
except UnicodeEncodeError:
pass
try:
import chardet
encoding = chardet.detect(unicode_)['encoding']
if encoding is None:
raise UnicodeEncodeError()
return unicode_.encode(encoding)
except (ImportError, UnicodeEncodeError):
return unicode_.encode(to_encoding, 'replace')
return safe_str
def author_email(author):
"""
returns email address of given author.
If any of <,> sign are found, it fallbacks to regex findall()
and returns first found result or empty string
Regex taken from http://www.regular-expressions.info/email.html
"""
import re
r = author.find('>')
l = author.find('<')
if l == -1 or r == -1:
# fallback to regex match of email out of a string
email_re = re.compile(r"""[a-z0-9!#$%&'*+/=?^_`{|}~-]+(?:\.[a-z0-9!"""
r"""#$%&'*+/=?^_`{|}~-]+)*@(?:[a-z0-9](?:[a-z"""
r"""0-9-]*[a-z0-9])?\.)+[a-z0-9](?:[a-z0-9-]"""
r"""*[a-z0-9])?""", re.IGNORECASE)
m = re.findall(email_re, author)
return m[0] if m else ''
return author[l + 1:r].strip()
def author_name(author):
"""
get name of author, or else username.
It'll try to find an email in the author string and just cut it off
to get the username
"""
if not '@' in author:
return author
else:
return author.replace(author_email(author), '').replace('<', '')\
.replace('>', '').strip()