# Copyright 2014-2016 OpenMarket Ltd
# Copyright 2020-2021 The Matrix.org Foundation C.I.C.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
|
2018-07-09 00:09:20 -06:00
|
|
|
import logging
|
2014-12-10 07:46:55 -07:00
|
|
|
from io import BytesIO
|
2022-06-01 04:57:49 -06:00
|
|
|
from types import TracebackType
|
|
|
|
from typing import Optional, Tuple, Type
|
2014-12-10 07:46:55 -07:00
|
|
|
|
2020-09-09 10:59:41 -06:00
|
|
|
from PIL import Image
|
2017-01-10 07:19:50 -07:00
|
|
|
|
2023-07-05 09:22:21 -06:00
|
|
|
from synapse.logging.opentracing import trace
|
|
|
|
|
2017-01-10 07:19:50 -07:00
|
|
|
logger = logging.getLogger(__name__)

# Numeric ID of the EXIF "Orientation" tag, used to look the value up in the
# EXIF dictionary returned by Pillow.
EXIF_ORIENTATION_TAG = 0x0112

# Maps an EXIF orientation value to the Pillow transpose operation that is
# applied to the image for that value. Values without an entry here (including
# 1) yield `None` from `.get()`, in which case no transposition is performed.
EXIF_TRANSPOSE_MAPPINGS = {
    2: Image.FLIP_LEFT_RIGHT,
    3: Image.ROTATE_180,
    4: Image.FLIP_TOP_BOTTOM,
    5: Image.TRANSPOSE,
    6: Image.ROTATE_270,
    7: Image.TRANSVERSE,
    8: Image.ROTATE_90,
}
|
|
|
|
|
2014-12-05 09:12:37 -07:00
|
|
|
|
2020-09-09 10:59:41 -06:00
|
|
|
class ThumbnailError(Exception):
    """Raised when a thumbnail cannot be generated for an image."""
|
|
|
|
|
|
|
|
|
2020-09-04 04:54:56 -06:00
|
|
|
class Thumbnailer:
    """Produces scaled or cropped thumbnails of a single image file.

    The image is opened with Pillow when the object is constructed and is held
    open until `close` is called, either directly, by leaving a `with` block,
    or by the finalizer.
    """

    # Supported output MIME types, mapped to the Pillow format name used when
    # encoding.
    FORMATS = {"image/jpeg": "JPEG", "image/png": "PNG"}

    @staticmethod
    def set_limits(max_image_pixels: int) -> None:
        """Set Pillow's module-wide `Image.MAX_IMAGE_PIXELS` limit.

        Args:
            max_image_pixels: The new value for `Image.MAX_IMAGE_PIXELS`.
        """
        Image.MAX_IMAGE_PIXELS = max_image_pixels

    def __init__(self, input_path: str):
        """Open the image and work out how it needs to be transposed.

        Args:
            input_path: Path of the image file to open.

        Raises:
            ThumbnailError: If Pillow fails to open the image, or rejects it
                as a decompression bomb.
        """
        # Have we closed the image?
        self._closed = False

        try:
            self.image = Image.open(input_path)
        except OSError as e:
            # If an error occurs opening the image, a thumbnail won't be able to
            # be generated.
            raise ThumbnailError from e
        except Image.DecompressionBombError as e:
            # If an image decompression bomb error occurs opening the image,
            # then the image exceeds the pixel limit and a thumbnail won't
            # be able to be generated.
            raise ThumbnailError from e

        self.width, self.height = self.image.size
        self.transpose_method = None
        try:
            # We don't use ImageOps.exif_transpose since it crashes with big EXIF
            #
            # Ignore safety: Pillow seems to acknowledge that this method is
            # "private, experimental, but generally widely used". Pillow 6
            # includes a public getexif() method (no underscore) that we might
            # consider using instead when we can bump that dependency.
            #
            # At the time of writing, Debian buster (currently oldstable)
            # provides version 5.4.1. It's expected to EOL in mid-2022, see
            # https://wiki.debian.org/DebianReleases#Production_Releases
            image_exif = self.image._getexif()  # type: ignore
            if image_exif is not None:
                image_orientation = image_exif.get(EXIF_ORIENTATION_TAG)
                # The orientation comes from the (untrusted) file, so check it
                # explicitly rather than with `assert`, which is stripped
                # under `python -O`. `type(x) is int` is deliberate: it
                # rejects `bool` and other `int` subclasses.
                if type(image_orientation) is int:
                    self.transpose_method = EXIF_TRANSPOSE_MAPPINGS.get(
                        image_orientation
                    )
                elif image_orientation is not None:
                    # A missing orientation tag is normal and not worth
                    # logging; a present-but-malformed one is.
                    logger.info(
                        "Error parsing image EXIF information: "
                        "unexpected orientation value %r",
                        image_orientation,
                    )
        except Exception as e:
            # A lot of parsing errors can happen when parsing EXIF
            logger.info("Error parsing image EXIF information: %s", e)

    @trace
    def transpose(self) -> Tuple[int, int]:
        """Transpose the image using its EXIF Orientation tag

        Does nothing if no transposition is pending, so it is safe to call
        more than once.

        Returns:
            A tuple containing the new image size in pixels as (width, height).
        """
        if self.transpose_method is not None:
            # Safety: `transpose` takes an int rather than e.g. an IntEnum.
            # self.transpose_method is set above to be a value in
            # EXIF_TRANSPOSE_MAPPINGS, and that only contains correct values.
            with self.image:
                # The `with` closes the old image once the transposed copy
                # has been created and stored.
                self.image = self.image.transpose(self.transpose_method)  # type: ignore[arg-type]
            self.width, self.height = self.image.size
            self.transpose_method = None
            # We don't need EXIF any more
            self.image.info["exif"] = None
        return self.image.size

    def aspect(self, max_width: int, max_height: int) -> Tuple[int, int]:
        """Calculate the largest size that preserves aspect ratio which
        fits within the given rectangle::

            (w_in / h_in) = (w_out / h_out)
            w_out = max(min(w_max, h_max * (w_in / h_in)), 1)
            h_out = max(min(h_max, w_max * (h_in / w_in)), 1)

        Args:
            max_width: The largest possible width.
            max_height: The largest possible height.

        Returns:
            The computed size as (width, height). The dimension that is
            derived from the aspect ratio is clamped to at least 1.
        """

        if max_width * self.height < max_height * self.width:
            # Width is the limiting dimension; derive the height from it.
            return max_width, max((max_width * self.height) // self.width, 1)
        else:
            # Height is the limiting dimension; derive the width from it.
            return max((max_height * self.width) // self.height, 1), max_height

    def _resize(self, width: int, height: int) -> Image.Image:
        """Return a copy of the image resized to exactly (width, height).

        As a side effect, images in mode "1", "L" or "P" are first converted
        in place (replacing `self.image`) to RGB, or RGBA if they carry
        transparency information.
        """
        # 1-bit or 8-bit color palette images need converting to RGB
        # otherwise they will be scaled using nearest neighbour which
        # looks awful.
        #
        # If the image has transparency, use RGBA instead.
        if self.image.mode in ["1", "L", "P"]:
            has_transparency = self.image.info.get("transparency", None) is not None
            target_mode = "RGBA" if has_transparency else "RGB"
            with self.image:
                # Close the pre-conversion image once it has been replaced.
                self.image = self.image.convert(target_mode)
        return self.image.resize((width, height), Image.LANCZOS)

    @trace
    def scale(self, width: int, height: int, output_type: str) -> BytesIO:
        """Rescales the image to the given dimensions.

        Args:
            width: The width of the output image, in pixels.
            height: The height of the output image, in pixels.
            output_type: The MIME type to encode as; must be a key of
                `FORMATS`.

        Returns:
            The bytes of the encoded image ready to be written to disk
        """
        with self._resize(width, height) as scaled:
            return self._encode_image(scaled, output_type)

    @trace
    def crop(self, width: int, height: int, output_type: str) -> BytesIO:
        """Rescales and crops the image to the given dimensions preserving
        aspect::

            (w_in / h_in) = (w_scaled / h_scaled)
            w_scaled = max(w_out, h_out * (w_in / h_in))
            h_scaled = max(h_out, w_out * (h_in / w_in))

        Args:
            width: The width of the output image, in pixels.
            height: The height of the output image, in pixels.
            output_type: The MIME type to encode as; must be a key of
                `FORMATS`.

        Returns:
            The bytes of the encoded image ready to be written to disk
        """
        if width * self.height > height * self.width:
            # Scale to the requested width, then trim the excess height
            # evenly from the top and bottom.
            scaled_width = width
            scaled_height = (width * self.height) // self.width
            crop_top = (scaled_height - height) // 2
            crop_bottom = height + crop_top
            crop = (0, crop_top, width, crop_bottom)
        else:
            # Scale to the requested height, then trim the excess width
            # evenly from the left and right.
            scaled_width = (height * self.width) // self.height
            scaled_height = height
            crop_left = (scaled_width - width) // 2
            crop_right = width + crop_left
            crop = (crop_left, 0, crop_right, height)

        with self._resize(scaled_width, scaled_height) as scaled_image:
            with scaled_image.crop(crop) as cropped:
                return self._encode_image(cropped, output_type)

    def _encode_image(self, output_image: Image.Image, output_type: str) -> BytesIO:
        """Encode an image into an in-memory buffer.

        Args:
            output_image: The image to encode.
            output_type: The MIME type to encode as; must be a key of
                `FORMATS`.

        Returns:
            A `BytesIO` holding the encoded image.

        Raises:
            KeyError: If `output_type` is not a key of `FORMATS`.
        """
        output_bytes_io = BytesIO()
        fmt = self.FORMATS[output_type]
        # JPEG output is always converted to RGB. PNG cannot store CMYK data,
        # so CMYK sources must be converted as well or `save` would fail.
        if fmt == "JPEG" or (fmt == "PNG" and output_image.mode == "CMYK"):
            output_image = output_image.convert("RGB")
        output_image.save(output_bytes_io, fmt, quality=80)
        return output_bytes_io

    def close(self) -> None:
        """Closes the underlying image file.

        Once closed no other functions can be called.

        Can be called multiple times.
        """

        if self._closed:
            return

        self._closed = True

        # Since we run this on the finalizer then we need to handle `__init__`
        # raising an exception before it can define `self.image`.
        image = getattr(self, "image", None)
        if image is None:
            return

        image.close()

    def __enter__(self) -> "Thumbnailer":
        """Make `Thumbnailer` a context manager that calls `close` on
        `__exit__`.
        """
        return self

    def __exit__(
        self,
        type: Optional[Type[BaseException]],
        value: Optional[BaseException],
        traceback: Optional[TracebackType],
    ) -> None:
        """Close the image on leaving the `with` block.

        Returns `None`, so any exception raised in the block propagates.
        """
        self.close()

    def __del__(self) -> None:
        # Make sure we actually do close the image, rather than leak data.
        self.close()