mirror of
https://github.com/marty-oehme/scripts.git
synced 2024-11-14 13:58:07 +00:00
203 lines
7.7 KiB
Python
203 lines
7.7 KiB
Python
import os
|
|
import re
|
|
import sys
|
|
import shutil
|
|
import hashlib
|
|
import platform
|
|
import subprocess
|
|
import urllib.error
|
|
import urllib.request
|
|
|
|
|
|
if platform.system() == 'Linux':
|
|
try:
|
|
import gi # TODO doesn't work on early Python 3 versions
|
|
gi.require_version('Gtk', '3.0')
|
|
from gi.repository import Gio, Gtk
|
|
except ImportError:
|
|
pass
|
|
|
|
|
|
class URL:
|
|
def __init__(self, url, folder_dir_path):
|
|
"""
|
|
:param url: http(s)://...
|
|
:param folder_dir_path: full absolute path to the note folder, to know where media folder is
|
|
"""
|
|
self.url = url.strip()
|
|
self.folder_dir_path = folder_dir_path
|
|
|
|
@property
|
|
def icon(self):
|
|
"""
|
|
Get URL favicon from google's service
|
|
:return: full absolute path to favicon image this function saved to media/favicons or nothing
|
|
"""
|
|
try:
|
|
favicon = urllib.request.urlopen('http://www.google.com/s2/favicons?domain=' + self.url, timeout=5)
|
|
except (urllib.error.HTTPError, urllib.error.URLError):
|
|
return
|
|
|
|
favicon_content = favicon.read()
|
|
favicon_hash = hashlib.md5(favicon_content).hexdigest()
|
|
|
|
if favicon_hash == '3ca64f83fdcf25135d87e08af65e68c9': # google's dummy icon
|
|
return
|
|
else:
|
|
favicon_dir_path = self.folder_dir_path + os.sep + 'media' + os.sep + 'favicons'
|
|
os.makedirs(favicon_dir_path, exist_ok=True)
|
|
favicon_path = favicon_dir_path + os.sep + favicon_hash + '.png'
|
|
if not os.path.isfile(favicon_path):
|
|
with open(favicon_path, 'wb') as favicon_file:
|
|
favicon_file.write(favicon_content)
|
|
return favicon_path
|
|
|
|
@property
|
|
def title(self):
|
|
"""
|
|
Try to parse title from the web page located at URL
|
|
:return: web page title for URL or nothing
|
|
"""
|
|
try:
|
|
html_text = urllib.request.urlopen(self.url).read().decode('utf-8') # TODO encodings other that utf-8, https fails on early Python 3 versions
|
|
except (urllib.error.HTTPError, urllib.error.URLError, UnicodeDecodeError):
|
|
title = ''
|
|
else:
|
|
title = re.search('<title.*?>(.+?)</title>', html_text, re.IGNORECASE | re.DOTALL).group(1)
|
|
|
|
if title:
|
|
return title
|
|
else:
|
|
return self.url.split('//')[-1].split('/')[0]
|
|
|
|
@property
|
|
def md(self):
|
|
"""
|
|
Get the most informative markdown syntax link for URL, with favicon and title if available
|
|
:return: Markdown syntax link for URL
|
|
"""
|
|
if self.icon:
|
|
md_favicon = '![](file://media/favicons/{}) '.format(os.path.basename(self.icon))
|
|
else:
|
|
md_favicon = ''
|
|
|
|
if self.title:
|
|
md_link = '[{}]({})'.format(self.title, self.url)
|
|
else:
|
|
md_link = '<{}>'.format(self.url)
|
|
|
|
return md_favicon + md_link
|
|
|
|
|
|
class File:
|
|
def __init__(self, link_path, folder_dir_path, title=''):
|
|
"""
|
|
:param link_path: full absolute path to the file
|
|
:param folder_dir_path: full absolute path to the note folder, to know where media folder is
|
|
:param title: optionally specify the file's title, otherwise file name will be used as such
|
|
"""
|
|
self.path = link_path.strip()
|
|
self.folder_dir_path = folder_dir_path
|
|
self.filename = os.path.basename(self.path)
|
|
self.ext = os.path.splitext(self.filename)[1]
|
|
|
|
if self.ext == '.pdf':
|
|
self.type = 'pdf'
|
|
elif self.ext in ('.jpg', '.jpeg', '.png', '.gif'):
|
|
self.type = 'image'
|
|
else:
|
|
self.type = 'other'
|
|
|
|
if title:
|
|
self.title = title
|
|
else:
|
|
self.title = os.path.splitext(self.filename)[0]
|
|
|
|
@property
|
|
def icon(self, icon_size=16, save=True):
|
|
"""
|
|
Get file type icon for File
|
|
:param icon_size: requested icon size
|
|
:param save: True to copy icon to media flder, otherwise will return path where OS stores the icon
|
|
:return: full absolute path to File icon or nothing
|
|
"""
|
|
if platform.system() == 'Linux':
|
|
try:
|
|
file = Gio.File.new_for_path(self.path)
|
|
|
|
file_info = file.query_info('standard::icon', 0, Gio.Cancellable())
|
|
file_icon = file_info.get_icon().get_names()[0]
|
|
|
|
icon_theme = Gtk.IconTheme.get_default()
|
|
icon_info = icon_theme.lookup_icon(file_icon, icon_size, 0)
|
|
icon_path = icon_info.get_filename()
|
|
except (NameError, AttributeError):
|
|
return ''
|
|
|
|
if os.path.isfile(icon_path):
|
|
if save:
|
|
icon_store_path = os.path.join(self.folder_dir_path, 'media', 'fileicons')
|
|
if not os.path.isfile(icon_store_path + os.sep + os.path.basename(icon_path)):
|
|
try:
|
|
os.makedirs(icon_store_path, exist_ok=True)
|
|
icon_path = shutil.copy(icon_path, icon_store_path)
|
|
icon_path = 'media/fileicons/' + os.path.basename(icon_path)
|
|
except OSError:
|
|
pass
|
|
|
|
return icon_path
|
|
|
|
@property
|
|
def thumb(self):
|
|
"""
|
|
Make a thumbnail for appropriate File
|
|
:return: full absolute path to File's thumbnail or nothing
|
|
"""
|
|
if self.type == 'pdf':
|
|
if platform.system() == 'Linux':
|
|
dpi = 30
|
|
thumb_path = os.path.join(self.folder_dir_path, 'media', 'thumbnails', 'th_' + self.filename + '.png')
|
|
os.makedirs(os.path.dirname(thumb_path), exist_ok=True)
|
|
|
|
subprocess.call(['gs', '-q', '-dNOPAUSE', '-dBATCH', '-sDEVICE=png16m', '-r' + str(dpi),
|
|
'-sOutputFile=' + thumb_path, '-dLastPage=1', self.path],
|
|
timeout=10)
|
|
|
|
if os.path.isfile(thumb_path):
|
|
return thumb_path
|
|
|
|
if self.type == 'image':
|
|
if platform.system() == 'Linux':
|
|
target_width = 600
|
|
img_width = int(subprocess.check_output(['identify', '-ping', '-format', '%w', self.path],
|
|
timeout=5).decode(sys.stdout.encoding))
|
|
if img_width > target_width:
|
|
thumb_path = os.path.join(self.folder_dir_path, 'media', 'thumbnails', 'th_' + self.filename)
|
|
os.makedirs(os.path.dirname(thumb_path), exist_ok=True)
|
|
|
|
subprocess.call(['convert', self.path, '-thumbnail', str(target_width),
|
|
'-auto-orient', '-unsharp', '0x.5', thumb_path],
|
|
timeout=10)
|
|
|
|
if os.path.isfile(thumb_path):
|
|
return thumb_path
|
|
|
|
@property
|
|
def md(self):
|
|
"""
|
|
Get the most informative markdown syntax link for File, as a thumbnail or with file icon if available
|
|
:return: Markdown syntax link for File
|
|
"""
|
|
link_path = os.path.relpath(self.path, self.folder_dir_path).replace(os.sep, '/')
|
|
thumb = self.thumb
|
|
if thumb:
|
|
return '[![{}](file://{})](file://{})'.format(self.title, 'media/thumbnails/' + os.path.basename(thumb), link_path)
|
|
elif self.type == 'image':
|
|
return '![{}](file://{})'.format(self.title, link_path)
|
|
else:
|
|
icon = self.icon
|
|
if icon:
|
|
return '![](file://{})'.format('media/fileicons/' + os.path.basename(self.icon)) + ' ' + \
|
|
'[{}](file://{})'.format(self.title, link_path)
|
|
else:
|
|
return '[{}](file://{})'.format(self.title, link_path)
|