# Copyright (C) 2021-2024, Mindee.# This program is licensed under the Apache License 2.0.# See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.fromtypingimportTupleimportnumpyasnpimporttensorflowastffromPILimportImagefromtensorflow.keras.utilsimportimg_to_arrayfromdoctr.utils.common_typesimportAbstractPath__all__=["tensor_from_pil","read_img_as_tensor","decode_img_as_tensor","tensor_from_numpy","get_img_shape"]deftensor_from_pil(pil_img:Image.Image,dtype:tf.dtypes.DType=tf.float32)->tf.Tensor:"""Convert a PIL Image to a TensorFlow tensor Args: pil_img: a PIL image dtype: the output tensor data type Returns: decoded image as tensor """npy_img=img_to_array(pil_img)returntensor_from_numpy(npy_img,dtype)
[docs]defread_img_as_tensor(img_path:AbstractPath,dtype:tf.dtypes.DType=tf.float32)->tf.Tensor:"""Read an image file as a TensorFlow tensor Args: img_path: location of the image file dtype: the desired data type of the output tensor. If it is float-related, values will be divided by 255. Returns: decoded image as a tensor """ifdtypenotin(tf.uint8,tf.float16,tf.float32):raiseValueError("insupported value for dtype")img=tf.io.read_file(img_path)img=tf.image.decode_jpeg(img,channels=3)ifdtype!=tf.uint8:img=tf.image.convert_image_dtype(img,dtype=dtype)img=tf.clip_by_value(img,0,1)returnimg
[docs]defdecode_img_as_tensor(img_content:bytes,dtype:tf.dtypes.DType=tf.float32)->tf.Tensor:"""Read a byte stream as a TensorFlow tensor Args: img_content: bytes of a decoded image dtype: the desired data type of the output tensor. If it is float-related, values will be divided by 255. Returns: decoded image as a tensor """ifdtypenotin(tf.uint8,tf.float16,tf.float32):raiseValueError("insupported value for dtype")img=tf.io.decode_image(img_content,channels=3)ifdtype!=tf.uint8:img=tf.image.convert_image_dtype(img,dtype=dtype)img=tf.clip_by_value(img,0,1)returnimg
deftensor_from_numpy(npy_img:np.ndarray,dtype:tf.dtypes.DType=tf.float32)->tf.Tensor:"""Read an image file as a TensorFlow tensor Args: npy_img: image encoded as a numpy array of shape (H, W, C) in np.uint8 dtype: the desired data type of the output tensor. If it is float-related, values will be divided by 255. Returns: same image as a tensor of shape (H, W, C) """ifdtypenotin(tf.uint8,tf.float16,tf.float32):raiseValueError("insupported value for dtype")ifdtype==tf.uint8:img=tf.convert_to_tensor(npy_img,dtype=dtype)else:img=tf.image.convert_image_dtype(npy_img,dtype=dtype)img=tf.clip_by_value(img,0,1)returnimgdefget_img_shape(img:tf.Tensor)->Tuple[int,int]:"""Get the shape of an image"""returnimg.shape[:2]