1
0
mirror of synced 2024-11-29 04:34:23 +01:00
mat2/libmat2/images.py

125 lines
4.6 KiB
Python
Raw Normal View History

2018-03-25 15:09:12 +02:00
import subprocess
import imghdr
2018-03-25 15:09:12 +02:00
import json
2018-04-01 00:43:36 +02:00
import os
import shutil
import tempfile
import re
from typing import Set
2018-03-25 15:09:12 +02:00
import cairo
2018-03-25 15:09:12 +02:00
import gi
gi.require_version('GdkPixbuf', '2.0')
from gi.repository import GdkPixbuf
2018-09-01 15:07:01 +02:00
from . import abstract, _get_exiftool_path
2018-03-25 15:09:12 +02:00
# Make pyflakes happy
assert Set
class _ImageParser(abstract.AbstractParser):
2018-07-19 23:10:27 +02:00
""" Since we use `exiftool` to get metadata from
all images fileformat, `get_meta` is implemented in this class,
and all the image-handling ones are inheriting from it."""
meta_whitelist = set() # type: Set[str]
@staticmethod
def __handle_problematic_filename(filename: str, callback) -> str:
""" This method takes a filename with a problematic name,
and safely applies it a `callback`."""
tmpdirname = tempfile.mkdtemp()
fname = os.path.join(tmpdirname, "temp_file")
shutil.copy(filename, fname)
out = callback(fname)
shutil.rmtree(tmpdirname)
return out
def get_meta(self):
""" There is no way to escape the leading(s) dash(es) of the current
self.filename to prevent parameter injections, so we need to take care
of this.
"""
2018-09-01 15:07:01 +02:00
fun = lambda f: subprocess.check_output([_get_exiftool_path(), '-json', f])
if re.search('^[a-z0-9/]', self.filename) is None:
out = self.__handle_problematic_filename(self.filename, fun)
else:
out = fun(self.filename)
meta = json.loads(out.decode('utf-8'))[0]
for key in self.meta_whitelist:
meta.pop(key, None)
return meta
class PNGParser(_ImageParser):
mimetypes = {'image/png', }
meta_whitelist = {'SourceFile', 'ExifToolVersion', 'FileName',
2018-05-16 22:36:59 +02:00
'Directory', 'FileSize', 'FileModifyDate',
'FileAccessDate', 'FileInodeChangeDate',
'FilePermissions', 'FileType', 'FileTypeExtension',
'MIMEType', 'ImageWidth', 'BitDepth', 'ColorType',
'Compression', 'Filter', 'Interlace', 'BackgroundColor',
'ImageSize', 'Megapixels', 'ImageHeight'}
def __init__(self, filename):
super().__init__(filename)
if imghdr.what(filename) != 'png':
raise ValueError
try: # better fail here than later
cairo.ImageSurface.create_from_png(self.filename)
2018-09-12 14:54:54 +02:00
except MemoryError: # pragma: no cover
raise ValueError
def remove_all(self):
surface = cairo.ImageSurface.create_from_png(self.filename)
surface.write_to_png(self.output_filename)
return True
class GdkPixbufAbstractParser(_ImageParser):
2018-04-02 23:40:08 +02:00
""" GdkPixbuf can handle a lot of surfaces, so we're rending images on it,
2018-07-19 23:10:27 +02:00
this has the side-effect of completely removing metadata.
2018-04-02 23:40:08 +02:00
"""
_type = ''
2018-03-25 15:09:12 +02:00
def remove_all(self):
2018-04-01 00:43:36 +02:00
_, extension = os.path.splitext(self.filename)
2018-03-25 15:09:12 +02:00
pixbuf = GdkPixbuf.Pixbuf.new_from_file(self.filename)
if extension.lower() == '.jpg':
extension = '.jpeg' # gdk is picky
pixbuf.savev(self.output_filename, extension[1:], [], [])
2018-03-25 15:09:12 +02:00
return True
2018-04-01 00:43:36 +02:00
def __init__(self, filename):
super().__init__(filename)
if imghdr.what(filename) != self._type: # better safe than sorry
raise ValueError
2018-04-01 00:43:36 +02:00
class JPGParser(GdkPixbufAbstractParser):
_type = 'jpeg'
mimetypes = {'image/jpeg'}
2018-04-01 00:43:36 +02:00
meta_whitelist = {'SourceFile', 'ExifToolVersion', 'FileName',
2018-05-16 22:36:59 +02:00
'Directory', 'FileSize', 'FileModifyDate',
'FileAccessDate', "FileInodeChangeDate",
'FilePermissions', 'FileType', 'FileTypeExtension',
'MIMEType', 'ImageWidth', 'ImageSize', 'BitsPerSample',
'ColorComponents', 'EncodingProcess', 'JFIFVersion',
'ResolutionUnit', 'XResolution', 'YCbCrSubSampling',
'YResolution', 'Megapixels', 'ImageHeight'}
2018-04-01 00:43:36 +02:00
class TiffParser(GdkPixbufAbstractParser):
_type = 'tiff'
2018-04-01 00:43:36 +02:00
mimetypes = {'image/tiff'}
meta_whitelist = {'Compression', 'ExifByteOrder', 'ExtraSamples',
2018-05-16 22:36:59 +02:00
'FillOrder', 'PhotometricInterpretation',
'PlanarConfiguration', 'RowsPerStrip', 'SamplesPerPixel',
'StripByteCounts', 'StripOffsets', 'BitsPerSample',
'Directory', 'ExifToolVersion', 'FileAccessDate',
'FileInodeChangeDate', 'FileModifyDate', 'FileName',
'FilePermissions', 'FileSize', 'FileType',
'FileTypeExtension', 'ImageHeight', 'ImageSize',
'ImageWidth', 'MIMEType', 'Megapixels', 'SourceFile'}