u/bodqhrohro/swineboard Commit - r1765:7a6a61e1

Show domain next to URL if available

neko259 -

r1765:7a6a61e1 default

parent child

boards/forms/__init__.py

0 +3 -3

              from boards.forms.fields import UrlFileField
              from boards.mdx_neboard import formatters
              from boards.models import Tag
-             from boards.models.attachment.downloaders import download
+             from boards.models.attachment.downloaders import download, REGEX_MAGNET
              from boards.models.post import TITLE_MAX_LENGTH
              from boards.utils import validate_file_size, get_file_mimetype, \
                  FILE_EXTENSION_DELIMITER
              REGEX_TAGS = re.compile(r'^[\w\s\d]+$', re.UNICODE)
              REGEX_USERNAMES = re.compile(r'^[\w\s\d,]+$', re.UNICODE)
-             REGEX_URL = re.compile(r'^(http|https|ftp|magnet):\/\/', re.UNICODE)
+             REGEX_URL = re.compile(r'^(http|https|ftp):\/\/', re.UNICODE)
              VETERAN_POSTING_DELAY = 5
                              self._update_file_extension(file)
                          except forms.ValidationError as e:
                              # Assume we will get the plain URL instead of a file and save it
-                             if REGEX_URL.match(url):
+                             if REGEX_URL.match(url) or REGEX_MAGNET.match(url):
                                  logger.info('Error in forms: {}'.format(e))
                                  return url
                              else:

boards/management/commands/statistics.py

0 +3 -4

                      print('* Domains and their usage')
                      domains = {}
                      for attachment in Attachment.objects.exclude(url=''):
-                         full_domain = attachment.url.split('/')[2]
-                         domain = get_domain(full_domain)
+                         domain = get_domain(attachment.url)
                          if domain in domains:
                              domains[domain] += 1
                          else:
                      print('* File types')
                      mimetypes = Attachment.objects.filter(url='')\
-                             .values('mimetype').annotate(count=Count('id'))\
-                             .order_by('-count')
+                         .values('mimetype').annotate(count=Count('id'))\
+                         .order_by('-count')
                      for mimetype in mimetypes:
                          print('{}: {}'.format(mimetype['mimetype'], mimetype['count']))

boards/models/attachment/downloaders.py

0 +9 -7

-             import os
-             import re
-             from django.core.files.uploadedfile import SimpleUploadedFile, \
-                 TemporaryUploadedFile
+             import requests
+             from django.core.files.uploadedfile import TemporaryUploadedFile
              from pytube import YouTube
-             import requests
              from boards.utils import validate_file_size
              FILE_DOWNLOAD_CHUNK_BYTES = 200000
-             YOUTUBE_URL = re.compile(r'https?://((www\.)?youtube\.com/watch\?v=|youtu.be/)[-\w]+')
+             REGEX_YOUTUBE_URL = re.compile(r'https?://((www\.)?youtube\.com/watch\?v=|youtu.be/)[-\w]+')
+             REGEX_MAGNET = re.compile(r'magnet:\?xt=urn:(btih:)?[a-z0-9]{20,50}.*')
              TYPE_URL_ONLY = (
                  'application/xhtml+xml',
                  @staticmethod
                  def handles(url: str) -> bool:
-                     return YOUTUBE_URL.match(url)
+                     return REGEX_YOUTUBE_URL.match(url) is not None
              class NothingDownloader(Downloader):
                  @staticmethod
                  def handles(url: str) -> bool:
+                     if REGEX_MAGNET.match(url) or REGEX_YOUTUBE_URL.match(url):
+                         return True
                      response_head = requests.head(url, verify=False)
                      content_type = response_head.headers[HEADER_CONTENT_TYPE].split(';')[0]
-                     return content_type in TYPE_URL_ONLY and not YOUTUBE_URL.match(url)
+                     return content_type in TYPE_URL_ONLY
                  @staticmethod
                  def download(url: str):

boards/models/attachment/viewers.py

0 +12 -4

                  def get_view(self):
                      return '<div class="image">' \
                             '{}' \
-                            '</div>'.format(self.get_format_view())
+                            '<div class="image-metadata">{}</div>' \
+                            '</div>'.format(self.get_format_view(), get_domain(self.url))
                  def get_format_view(self):
                      protocol = self.url.split('://')[0]
-                     full_domain = self.url.split('/')[2]
-                     domain = get_domain(full_domain)
+                     domain = get_domain(self.url)
                      if protocol in URL_PROTOCOLS:
                          url_image_name = URL_PROTOCOLS.get(protocol)
-                     else:
+                     elif domain:
                          filename = 'images/domains/{}.png'.format(domain)
                          if file_exists(filename):
                              url_image_name = 'domains/' + domain
                          else:
                              url_image_name = FILE_STUB_URL
+                     else:
+                         url_image_name = FILE_STUB_URL
                      image_path = 'images/{}.png'.format(url_image_name)
                      image = static(image_path)
                      return '<a href="{}">' \
                             '<img class="url-image" src="{}" width="{}" height="{}"/>' \
                             '</a>'.format(self.url, image, w, h)
+                 def _get_protocol(self):
+                     pass

boards/utils.py

0 +19 -13

		@@ -153,21 +153,27 b' def get_domain(url: str) -> str:'
153	153	"""
154	154	Gets domain from an URL with random number of domain levels.
155	155	"""
156		levels = url.split('.')
157		if len(levels) < 2:
158		return url
159
160		top = levels[-1]
161		second = levels[-2]
	156	domain_parts = url.split('/')
	157	if len(domain_parts) >= 2:
	158	full_domain = domain_parts[2]
	159	else:
	160	full_domain = ''
162	161
163		has_third_level = len(levels) > 2
164		if has_third_level:
165		third = levels[-3]
	162	result = full_domain
	163	if full_domain:
	164	levels = full_domain.split('.')
	165	if len(levels) >= 2:
	166	top = levels[-1]
	167	second = levels[-2]
166	168
167		if has_third_level and ('{}.{}'.format(second, top) in KNOWN_DOMAINS):
168		result = '{}.{}.{}'.format(third, second, top)
169		else:
170		result = '{}.{}'.format(second, top)
	169	has_third_level = len(levels) > 2
	170	if has_third_level:
	171	third = levels[-3]
	172
	173	if has_third_level and ('{}.{}'.format(second, top) in KNOWN_DOMAINS):
	174	result = '{}.{}.{}'.format(third, second, top)
	175	else:
	176	result = '{}.{}'.format(second, top)
171	177
172	178	return result
173	179

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages