"""
Internal module implementing multi-media objects and utilities in MLflow. Multi-media objects are
exposed to users at the top-level :py:mod:`mlflow` module.
"""
import warnings
from typing import TYPE_CHECKING, Optional, Union
if TYPE_CHECKING:
import numpy
import PIL
COMPRESSED_IMAGE_SIZE = 256
def compress_image_size(
image: "PIL.Image.Image", max_size: Optional[int] = COMPRESSED_IMAGE_SIZE
) -> "PIL.Image.Image":
"""
Scale the image to fit within a square with length `max_size` while maintaining
the aspect ratio.
"""
# scale the image to max(width, height) <= compressed_file_max_size
width, height = image.size
if width > height:
new_width = max_size
new_height = int(height * (new_width / width))
else:
new_height = max_size
new_width = int(width * (new_height / height))
return image.resize((new_width, new_height))
def convert_to_pil_image(image: Union["numpy.ndarray", list]) -> "PIL.Image.Image":
"""
Convert a numpy array to a PIL image.
"""
import numpy as np
try:
from PIL import Image
except ImportError as exc:
raise ImportError(
"Pillow is required to serialize a numpy array as an image. "
"Please install it via: `pip install Pillow`"
) from exc
def _normalize_to_uint8(x):
is_int = np.issubdtype(x.dtype, np.integer)
low = 0
high = 255 if is_int else 1
if x.min() < low or x.max() > high:
if is_int:
raise ValueError(
"Integer pixel values out of acceptable range [0, 255]. "
f"Found minimum value {x.min()} and maximum value {x.max()}. "
"Ensure all pixel values are within the specified range."
)
else:
warnings.warn(
"Float pixel values out of acceptable range [0.0, 1.0]. "
f"Found minimum value {x.min()} and maximum value {x.max()}. "
"Rescaling values to [0.0, 1.0] with min/max scaler.",
stacklevel=2,
)
# Min-max scaling
x = (x - x.min()) / (x.max() - x.min())
# float or bool
if not is_int:
x = x * 255
return x.astype(np.uint8)
# Ref.: https://numpy.org/doc/stable/reference/generated/numpy.dtype.kind.html#numpy-dtype-kind
valid_data_types = {
"b": "bool",
"i": "signed integer",
"u": "unsigned integer",
"f": "floating",
}
if image.dtype.kind not in valid_data_types:
raise TypeError(
f"Invalid array data type: '{image.dtype}'. "
f"Must be one of {list(valid_data_types.values())}"
)
if image.ndim not in [2, 3]:
raise ValueError(f"`image` must be a 2D or 3D array but got image shape: {image.shape}")
if (image.ndim == 3) and (image.shape[2] not in [1, 3, 4]):
raise ValueError(f"Invalid channel length: {image.shape[2]}. Must be one of [1, 3, 4]")
# squeeze a 3D grayscale image since `Image.fromarray` doesn't accept it.
if image.ndim == 3 and image.shape[2] == 1:
image = image[:, :, 0]
image = _normalize_to_uint8(image)
return Image.fromarray(image)
# MLflow media object: Image
[docs]class Image:
"""
`mlflow.Image` is an image media object that provides a lightweight option
for handling images in MLflow.
The image can be a numpy array, a PIL image, or a file path to an image. The image is
stored as a PIL image and can be logged to MLflow using `mlflow.log_image` or
`mlflow.log_table`.
Args:
image: Image can be a numpy array, a PIL image, or a file path to an image.
.. code-block:: python
:caption: Example
import mlflow
import numpy as np
from PIL import Image
# Create an image as a numpy array
image = np.zeros((100, 100, 3), dtype=np.uint8)
image[:, :50] = [255, 128, 0]
# Create an Image object
image_obj = mlflow.Image(image)
# Convert the Image object to a list of pixel values
pixel_values = image_obj.to_list()
"""
def __init__(self, image: Union["numpy.ndarray", "PIL.Image.Image", str, list]):
import numpy as np
try:
from PIL import Image
except ImportError as exc:
raise ImportError(
"`mlflow.Image` requires Pillow to serialize a numpy array as an image. "
"Please install it via: `pip install Pillow`."
) from exc
if isinstance(image, str):
self.image = Image.open(image)
elif isinstance(image, (list, np.ndarray)):
self.image = convert_to_pil_image(np.array(image))
elif isinstance(image, Image.Image):
self.image = image
else:
raise TypeError(
f"Unsupported image object type: {type(image)}. "
"`image` must be one of numpy.ndarray, "
"PIL.Image.Image, or a filepath to an image."
)
self.size = self.image.size
[docs] def to_list(self):
"""
Convert the image to a list of pixel values.
Returns:
List of pixel values.
"""
return list(self.image.getdata())
[docs] def to_array(self):
"""
Convert the image to a numpy array.
Returns:
Numpy array of pixel values.
"""
import numpy as np
return np.array(self.image)
[docs] def to_pil(self):
"""
Convert the image to a PIL image.
Returns:
PIL image.
"""
return self.image
[docs] def save(self, path: str):
"""
Save the image to a file.
Args:
path: File path to save the image.
"""
self.image.save(path)
[docs] def resize(self, size: tuple[int, int]):
"""
Resize the image to the specified size.
Args:
size: Size to resize the image to.
Returns:
A copy of the resized image object.
"""
image = self.image.resize(size)
return Image(image)