""" This module provides some useful tools for ``vcs`` like annotate/diff html output. It also includes some internal helpers. """ import sys import time import datetime def makedate(): lt = time.localtime() if lt[8] == 1 and time.daylight: tz = time.altzone else: tz = time.timezone return time.mktime(lt), tz def date_fromtimestamp(unixts, tzoffset=0): """ Makes a local datetime object out of unix timestamp :param unixts: :param tzoffset: """ return datetime.datetime.fromtimestamp(float(unixts)) def safe_unicode(str_, from_encoding='utf8'): """ safe unicode function. Does few trick to turn str_ into unicode In case of UnicodeDecode error we try to return it with encoding detected by chardet library if it fails fallback to unicode with errors replaced :param str_: string to decode :rtype: unicode :returns: unicode object """ if isinstance(str_, unicode): return str_ try: return unicode(str_) except UnicodeDecodeError: pass try: return unicode(str_, from_encoding) except UnicodeDecodeError: pass try: import chardet encoding = chardet.detect(str_)['encoding'] if encoding is None: raise Exception() return str_.decode(encoding) except (ImportError, UnicodeDecodeError, Exception): return unicode(str_, from_encoding, 'replace') def safe_str(unicode_, to_encoding='utf8'): """ safe str function. Does few trick to turn unicode_ into string In case of UnicodeEncodeError we try to return it with encoding detected by chardet library if it fails fallback to string with errors replaced :param unicode_: unicode to encode :rtype: str :returns: str object """ if isinstance(unicode_, str): return unicode_ try: return unicode_.encode(to_encoding) except UnicodeEncodeError: pass try: import chardet encoding = chardet.detect(unicode_)['encoding'] print encoding if encoding is None: raise UnicodeEncodeError() return unicode_.encode(encoding) except (ImportError, UnicodeEncodeError): return unicode_.encode(to_encoding, 'replace') return safe_str def author_email(author): """ returns email address of given author. If any of <,> sign are found, it fallbacks to regex findall() and returns first found result or empty string Regex taken from http://www.regular-expressions.info/email.html """ import re r = author.find('>') l = author.find('<') if l == -1 or r == -1: # fallback to regex match of email out of a string email_re = re.compile(r"""[a-z0-9!#$%&'*+/=?^_`{|}~-]+(?:\.[a-z0-9!""" r"""#$%&'*+/=?^_`{|}~-]+)*@(?:[a-z0-9](?:[a-z""" r"""0-9-]*[a-z0-9])?\.)+[a-z0-9](?:[a-z0-9-]""" r"""*[a-z0-9])?""", re.IGNORECASE) m = re.findall(email_re, author) return m[0] if m else '' return author[l + 1:r].strip() def author_name(author): """ get name of author, or else username. It'll try to find an email in the author string and just cut it off to get the username """ if not '@' in author: return author else: return author.replace(author_email(author), '').replace('<', '')\ .replace('>', '').strip()