u/bodqhrohro/swineboard Commit - r1765:7a6a61e1

Show domain next to URL if available

neko259 -

r1765:7a6a61e1 default

parent child

boards/forms/__init__.py

0 +3 -3

             from boards.forms.fields import UrlFileField
             from boards.mdx_neboard import formatters
             from boards.models import Tag
-            from boards.models.attachment.downloaders import download
+            from boards.models.attachment.downloaders import download, REGEX_MAGNET
             from boards.models.post import TITLE_MAX_LENGTH
             from boards.utils import validate_file_size, get_file_mimetype, \
                 FILE_EXTENSION_DELIMITER
             REGEX_TAGS = re.compile(r'^[\w\s\d]+$', re.UNICODE)
             REGEX_USERNAMES = re.compile(r'^[\w\s\d,]+$', re.UNICODE)
-            REGEX_URL = re.compile(r'^(http|https|ftp|magnet):\/\/', re.UNICODE)
+            REGEX_URL = re.compile(r'^(http|https|ftp):\/\/', re.UNICODE)
             VETERAN_POSTING_DELAY = 5
                             self._update_file_extension(file)
                         except forms.ValidationError as e:
                             # Assume we will get the plain URL instead of a file and save it
-                            if REGEX_URL.match(url):
+                            if REGEX_URL.match(url) or REGEX_MAGNET.match(url):
                                 logger.info('Error in forms: {}'.format(e))
                                 return url
                             else:

boards/management/commands/statistics.py

0 +3 -4

                     print('* Domains and their usage')
                     domains = {}
                     for attachment in Attachment.objects.exclude(url=''):
-                        full_domain = attachment.url.split('/')[2]
+                        domain = get_domain(attachment.url)
-                        domain = get_domain(full_domain)
                         if domain in domains:
                             domains[domain] += 1
                         else:
                     print('* File types')
                     mimetypes = Attachment.objects.filter(url='')\
-                            .values('mimetype').annotate(count=Count('id'))\
+                        .values('mimetype').annotate(count=Count('id'))\
-                            .order_by('-count')
+                        .order_by('-count')
                     for mimetype in mimetypes:
                         print('{}: {}'.format(mimetype['mimetype'], mimetype['count']))

boards/models/attachment/downloaders.py

0 +9 -7

-            import os
             import re
-            from django.core.files.uploadedfile import SimpleUploadedFile, \
+            import requests
-                TemporaryUploadedFile
+            from django.core.files.uploadedfile import TemporaryUploadedFile
             from pytube import YouTube
-            import requests
             from boards.utils import validate_file_size
             FILE_DOWNLOAD_CHUNK_BYTES = 200000
-            YOUTUBE_URL = re.compile(r'https?://((www\.)?youtube\.com/watch\?v=|youtu.be/)[-\w]+')
+            REGEX_YOUTUBE_URL = re.compile(r'https?://((www\.)?youtube\.com/watch\?v=|youtu.be/)[-\w]+')
+            REGEX_MAGNET = re.compile(r'magnet:\?xt=urn:(btih:)?[a-z0-9]{20,50}.*')
             TYPE_URL_ONLY = (
                 'application/xhtml+xml',
                 @staticmethod
                 def handles(url: str) -> bool:
-                    return YOUTUBE_URL.match(url)
+                    return REGEX_YOUTUBE_URL.match(url) is not None
             class NothingDownloader(Downloader):
                 @staticmethod
                 def handles(url: str) -> bool:
+                    if REGEX_MAGNET.match(url) or REGEX_YOUTUBE_URL.match(url):
+                        return True
                     response_head = requests.head(url, verify=False)
                     content_type = response_head.headers[HEADER_CONTENT_TYPE].split(';')[0]
-                    return content_type in TYPE_URL_ONLY and not YOUTUBE_URL.match(url)
+                    return content_type in TYPE_URL_ONLY
                 @staticmethod
                 def download(url: str):

boards/models/attachment/viewers.py

0 +12 -4

                 def get_view(self):
                     return '<div class="image">' \
                            '{}' \
-                           '</div>'.format(self.get_format_view())
+                           '<div class="image-metadata">{}</div>' \
+                           '</div>'.format(self.get_format_view(), get_domain(self.url))
                 def get_format_view(self):
                     protocol = self.url.split('://')[0]
-                    full_domain = self.url.split('/')[2]
-                    domain = get_domain(full_domain)
+                    domain = get_domain(self.url)
                     if protocol in URL_PROTOCOLS:
                         url_image_name = URL_PROTOCOLS.get(protocol)
-                    else:
+                    elif domain:
                         filename = 'images/domains/{}.png'.format(domain)
                         if file_exists(filename):
                             url_image_name = 'domains/' + domain
                         else:
                             url_image_name = FILE_STUB_URL
+                    else:
+                        url_image_name = FILE_STUB_URL
                     image_path = 'images/{}.png'.format(url_image_name)
                     image = static(image_path)
                     return '<a href="{}">' \
                            '<img class="url-image" src="{}" width="{}" height="{}"/>' \
                            '</a>'.format(self.url, image, w, h)
+                def _get_protocol(self):
+                    pass

boards/utils.py

0 +19 -13

@@ -153,21 +153,27 b' def get_domain(url: str) -> str:'
153	"""	153	"""
154	Gets domain from an URL with random number of domain levels.	154	Gets domain from an URL with random number of domain levels.
155	"""	155	"""
156	levels = url.split('.')	156	domain_parts = url.split('/')
157	if len(levels) < 2:	157	if len(domain_parts) >= 2:
158	return url	158	full_domain = domain_parts[2]
159		159	else:
160	top = levels[-1]	160	full_domain = ''
161	second = levels[-2]
162		161
163	has_third_level = len(levels) > 2	162	result = full_domain
164	if has_third_level:	163	if full_domain:
165	third = levels[-3]	164	levels = full_domain.split('.')
		165	if len(levels) >= 2:
		166	top = levels[-1]
		167	second = levels[-2]
166		168
167	if has_third_level and ('{}.{}'.format(second, top) in KNOWN_DOMAINS):	169	has_third_level = len(levels) > 2
168	result = '{}.{}.{}'.format(third, second, top)	170	if has_third_level:
169	else:	171	third = levels[-3]
170	result = '{}.{}'.format(second, top)	172
		173	if has_third_level and ('{}.{}'.format(second, top) in KNOWN_DOMAINS):
		174	result = '{}.{}.{}'.format(third, second, top)
		175	else:
		176	result = '{}.{}'.format(second, top)
171		177
172	return result	178	return result
173		179

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages