enhance_image_skimage.py

import os
import math
import rawpy
import cv2
import numpy as np

from tqdm import tqdm
from skimage.color import rgb2gray
from skimage import img_as_float
from glob import glob
from argparse import ArgumentParser
from imutils.paths import list_images

sp = os.path.sep


class Enhancer(object):
    def __init__(self, parameters: dict):

        self.parameters = parameters
        self.adjust_parameters()

    def adjust_parameters(self):

        if "local_contrast" in self.parameters:
            self.parameters["local_contrast"] = float(self.parameters["local_contrast"])
            if self.parameters["local_contrast"] < 0:
                self.parameters["local_contrast"] = 0
        else:
            self.parameters["local_contrast"] = 1.2  # default: slight increase

        if "mid_tones" in self.parameters:
            self.parameters["mid_tones"] = float(self.parameters["mid_tones"])
            if self.parameters["mid_tones"] > 1:
                self.parameters["mid_tones"] = 1
            if self.parameters["mid_tones"] < 0:
                self.parameters["mid_tones"] = 0
        else:
            self.parameters["mid_tones"] = 0.5  # default: middle of the range

        if "tonal_width" in self.parameters:
            self.parameters["tonal_width"] = float(self.parameters["tonal_width"])
            if self.parameters["tonal_width"] > 1:
                self.parameters["tonal_width"] = 1
            if self.parameters["tonal_width"] < 0:
                self.parameters["tonal_width"] = 0
        else:
            self.parameters["tonal_width"] = 0.5  # default: middle of the range

        if "areas_dark" in self.parameters:
            self.parameters["areas_dark"] = float(self.parameters["areas_dark"])
            if self.parameters["areas_dark"] > 1:
                self.parameters["areas_dark"] = 1
            if self.parameters["areas_dark"] < 0:
                self.parameters["areas_dark"] = 0
        else:
            self.parameters["areas_dark"] = 0.2  # default: gentle increase

        if "areas_bright" in self.parameters:
            self.parameters["areas_bright"] = float(self.parameters["areas_bright"])
            if self.parameters["areas_bright"] > 1:
                self.parameters["areas_bright"] = 1
            if self.parameters["areas_bright"] < 0:
                self.parameters["areas_bright"] = 0
        else:
            self.parameters["areas_bright"] = 0.2  # default: gentle increase

        if "brightness" in self.parameters:
            self.parameters["brightness"] = float(self.parameters["brightness"])
            if self.parameters["brightness"] > 1:
                self.parameters["brightness"] = 1
            if self.parameters["brightness"] < -1:
                self.parameters["brightness"] = -1
        else:
            self.parameters["brightness"] = 0.1  # default: gentle increase

        if "preserve_tones" in self.parameters:
            self.parameters["preserve_tones"] = bool(self.parameters["preserve_tones"])
        else:
            self.parameters["preserve_tones"] = True  # default: preserve tones

        if "color_correction" in self.parameters:
            self.parameters["color_correction"] = bool(
                self.parameters["color_correction"]
            )
        else:
            self.parameters["color_correction"] = False  # default: no correction

        if "saturation_degree" in self.parameters:
            self.parameters["saturation_degree"] = float(
                self.parameters["saturation_degree"]
            )
            if self.parameters["saturation_degree"] < 0:
                self.parameters["saturation_degree"] = 0
        else:
            self.parameters["saturation_degree"] = 1.2  # default: slight increase

    def map_value(
        self,
        value,
        range_in=(0, 1),
        range_out=(0, 1),
        invert=False,
        non_lin_convex=None,
        non_lin_concave=None,
    ):

        """
        ---------------------------------------------------------------------------
        Map a scalar value to an output range in a linear/non-linear way
        ---------------------------------------------------------------------------

        Map scalar values to a particular range, in a linear or non-linear way.
        This can be helpful for adjusting the range and nonlinear response of
        parameters.

        For more info on the non-linear functions check:
        Vonikakis, V., Winkler, S. (2016). A center-surround framework for spatial
        image processing. Proc. IS&T Human Vision & Electronic Imaging.


        INPUTS
        ------
        value: float
            Input value to be mapped.
        range_in: tuple (min,max)
            Range of input value. The min and max values that the input value can
            attain.
        range_out: tuple (min,max)
            Range of output value. The min and max values that the mapped input
            value can attain.
        invert: Bool
            Invert or not the input value. If invert, then min->max and max->min.
        non_lin_convex: None or float (0,inf)
            If None, no non-linearity is applied. If float, then a convex
            non-linearity is applied, which lowers the values, while not affecting
            the min and max. non_lin_convex controls the steepness of the
            non-linear mapping. Small values near zero, result in a steeper curve.
        non_lin_concave: None or float (0,inf)
            If None, no non-linearity is applied. If float, then a concave
            non-linearity is applied, which increases the values, while not
            affecting min and max. non_lin_concave controls the steepness of the
            non-linear mapping. Small values near zero, result in a steeper curve.

        OUTPUT
        ------
        Mapped value

        """

        # truncate value to within input range limits
        if value > range_in[1]:
            value = range_in[1]
        if value < range_in[0]:
            value = range_in[0]

        # map values linearly to [0,1]
        value = (value - range_in[0]) / (range_in[1] - range_in[0])

        # invert values
        if invert is True:
            value = 1 - value

        # apply convex non-linearity
        if non_lin_convex is not None:
            value = (value * non_lin_convex) / (1 + non_lin_convex - value)

        # apply concave non-linearity
        if non_lin_concave is not None:
            value = ((1 + non_lin_concave) * value) / (non_lin_concave + value)

        # mapping value to the output range in a linear way
        value = value * (range_out[1] - range_out[0]) + range_out[0]

        return value

    def srgb_to_linear(self, image_srgb):

        """
        ---------------------------------------------------------------------------
                Transform an image from sRGB color space to linear
        ---------------------------------------------------------------------------

        The function undos the main non-linearities associated with the sRGB color
        space, in order to approximate a linear color response. Note that the
        linear image output will look darker, because the gamma correction will be
        undone. The transformation formulas can be found in the EasyRGB website:
        https://www.easyrgb.com/en/math.php

        Note that the formulas may look slightly different. This is because they
        have been altered in order to implement them in a vectorized way, avoiding
        for loops. As such, an image is partitioned in 2 parts image_upper and
        image_lower, which implement separate parts of the piece-wise color
        transformation formula.


        INPUTS
        ------
        image_srgb: numpy array of WxHx3 of uint8 [0,255]
            Input color image with values in the interval [0,255]. Assuming that
            it is encoded on the sRGB color space. The code will still work if the
            input image is grayscale or within [0,1] range.

        OUTPUT
        ------
        image_linear: numpy array of WxHx3 of float [0,1]
            Output color linear image with values in the interval [0,1]. Gamma has
            been removed, so it looks darker.

        """

        # dealing with different input dimensions
        dimensions = len(image_srgb.shape)
        if dimensions == 1:
            image_srgb = np.expand_dims(image_srgb, axis=2)  # make a 3rd dimension

        image_srgb = img_as_float(image_srgb)  # [0,1]

        # lower part of the piecewise formula
        image_lower = image_srgb.copy()
        image_lower[image_lower > 0.04045] = 0
        image_lower = image_lower / 12.92

        # upper part of the piecewise formula
        image_upper = image_srgb.copy()
        image_upper = image_upper + 0.055
        image_upper[image_upper <= (0.04045 + 0.055)] = 0
        image_upper = image_upper / 1.055
        image_upper = image_upper**2.4

        image_linear = image_lower + image_upper  # combine into the final result

        return image_linear

    def linear_to_srgb(self, image_linear):

        """
        ---------------------------------------------------------------------------
                Transform an image from linear to sRGB color space
        ---------------------------------------------------------------------------

        The function re-applies the main non-linearities associated with the sRGB
        color space. The transformation formula can be found in EasyRGB website:
        https://www.easyrgb.com/en/math.php

        Note that the formulas may look slightly different. This is because they
        have been altered in order to implement them in a vectorized way, avoiding
        for loops. As such, an image is partitioned in 2 parts image_upper and
        image_lower, which implement separate parts of the piece-wise color
        transformation formula.


        INPUTS
        ------
        image_linear: numpy array of WxHx3 of float [0,1]
            Input color image with values in the interval [0,1].

        OUTPUT
        ------
        image_srgb: numpy array of WxHx3 of uint8 [0,255]
            Output color sRGB image with values in the interval [0,255].

        """

        # dealing with different input dimensions
        dimensions = len(image_linear.shape)
        if dimensions == 1:
            image_linear = np.expand_dims(image_linear, axis=2)  # 3rd dimension

        image_linear = img_as_float(image_linear)  # [0,1]

        # lower part of the piecewise formula
        image_lower = image_linear.copy()
        image_lower[image_lower > 0.0031308] = 0
        image_lower = image_lower * 12.92

        # upper part of the piecewise formula
        image_upper = image_linear.copy()
        image_upper[image_upper <= 0.0031308] = 0
        image_upper = image_upper ** (1 / 2.4)
        image_upper = image_upper * 1.055
        image_upper = image_upper - 0.055

        image_srgb = image_lower + image_upper
        image_srgb = np.clip(a=image_srgb, a_min=0, a_max=1, out=image_srgb)

        return (image_srgb * 255).astype(np.uint8)

    def get_sigmoid_lut(self, resolution=256, threshold=0.2, non_linearirty=0.2):
        """
        ---------------------------------------------------------------------------
        Creates a paramteric sigmoid function and stores it in a LUT
        ---------------------------------------------------------------------------

        The sigmoid function is defined as a piece-wise function of 2 inverse
        non-linearities. This allows full control of the inflection point
        (threshold) and the degree of 'sharpness' of each non-linearity. The
        non-linear curves used here are described in the paper:
        Vonikakis, V., Winkler, S. (2016). A center-surround framework for spatial
        image processing. Proc. IS&T Human Vision & Electronic Imaging.

        LUT = Look Up Table

        INPUTS
        ------
        resolution: int
            The size of the LUT (how many inputs).
        threshold: float in the range [0,1]
            The position of the inflection point of the sigmoid function (0.5 in
            the mid_tonedle of the range).
        non_linearirty: float in range (0, inf)
            Controls the non-linearity of the curve before and after the inflection
            point. It should not be 0. The smaller it is (asymptotically to 0) the
            'sharper' the non-linearity. After ~5 it asymptotically approaches a
            linerity.

        OUTPUT
        ------
        lut: float numpy array of size equal to resolution
            The output sigmoid lut.

        """

        max_value = resolution - 1  # the maximum attainable value
        thr = threshold * max_value  # threshold in the range [0,resolution-1]
        alpha = non_linearirty * max_value  # controls non-linearity degree
        beta = max_value - thr
        if beta == 0:
            beta = 0.001

        lut = np.zeros(resolution, dtype="float")

        for i in range(resolution):

            i_comp = i - thr  # complement of i

            # upper part of the piece-wise sigmoid function
            if i >= thr:
                lut[i] = (
                    (((alpha + beta) * i_comp) / (alpha + i_comp)) * (1 / (2 * beta))
                ) + 0.5

            # lower part of the piece-wise sigmoid function
            else:
                lut[i] = (alpha * i) / (alpha - i_comp) * (1 / (2 * thr))

        return lut

    def get_membership_luts(
        self, resolution=256, lower_threshold=0.35, upper_threshold=0.65
    ):

        """
        ---------------------------------------------------------------------------
        Creates 3 paramteric traspezoid membership functions
        ---------------------------------------------------------------------------

        The trapezoid functions are defined as piece-wise functions between the
        0, lower_threshold, upper_threshold, 1. These trapezoid membership
        functions can be used to filter out which parts of each exposure to be
        used during exposure fusion. More details can be found in the following
        paper:

        Vonikakis, V., Bouzos, O. & Andreadis, I. (2011). Multi-Exposure Image
        Fusion Based on Illumination Estimation, SIPA2011 (pp.135-142), Greece.


        INPUTS
        ------
        resolution: int
            The size of the LUT (how many inputs).
        lower_threshold: float in the range [0,1]
            The position of the lower inflection point of the trapezoid functions.
            It should be always lower compared to the upper_threshold.
        upper_threshold: float in the range [0,1]
            The position of the upper inflection point of the trapezoid functions.
            It should be always higher compared to the lower_threshold.

        OUTPUT
        ------
        lut_lower: float numpy array of size equal to resolution, values in [0,1]
            The lower trepezoid membership function.
        lut_mid: float numpy array of size equal to resolution, values in [0,1]
            The middle trepezoid membership function.
        lut_upper float numpy array of size equal to resolution, values in [0,1]
            The upper trepezoid membership function.

        """

        lut_lower = np.zeros(resolution, dtype="float")
        lut_mid = np.zeros(resolution, dtype="float")
        lut_upper = np.zeros(resolution, dtype="float")

        for i in range(resolution):

            i_float = i / (resolution - 1)

            # lower trapezoid membership function
            if i_float <= lower_threshold:
                lut_lower[i] = i_float / lower_threshold
            else:
                lut_lower[i] = 1

            # middle trapezoid membership function
            if i_float <= lower_threshold:
                lut_mid[i] = i_float / lower_threshold
            elif i_float <= upper_threshold:
                lut_mid[i] = 1
            else:
                lut_mid[i] = (1 - i_float) / (1 - upper_threshold)

            # upper trapezoid membership function
            if i_float <= upper_threshold:
                lut_upper[i] = 1
            else:
                lut_upper[i] = (1 - i_float) / (1 - upper_threshold)

        return lut_lower, lut_mid, lut_upper

    def get_photometric_mask(
        self, image: np.ndarray, smoothing=0.2, grayscale_out=True
    ):
        """
        ---------------------------------------------------------------------------
        Estimate the photometric mask of an image by using edge-aware blurring
        ---------------------------------------------------------------------------

        Applies strong blurring while preserving the strong edges of the image in
        order to avoid halo artifacts. Inspired by the paper:
        Shaked, Doron & Keshet, Renato. (2004). "Robust Recursive Envelope
        Operators for Fast Retinex."


        INPUTS
        ------
        image: numpy array (WxH or WxHxK of uint8 [0.255] or float [0,1])
            Input image.
        smoothing: float in the interval [0,1]
            Value controlling the blur's strenght. 0 indicates no blur. Values
            between 0-1 increase blurring strength while preserving edges. Values
            above 1 approximate very strong gaussian blurring (large sigmas) where
            no edges are preserved. Practically, values above 10 result into a
            uniform image.
        grayscale_out: logical
            Whether or not the photometric mask is going to be grayscale or not.
            If the input image is already grayscale (2D) then this parameter is
            irrelevant.

        OUTPUT
        ------
        image_ph_mask: numpy array of WxH or WxHxK of float [0,1]
            Photometric mask of the input image.

        Intuition about the threshold and non_linearirty values of the LUTs
        threshold:
            The larger it is, the stronger the blurring, the better the local
            contrast but also more halo artifacts (less edge preservation).
        non_linearirty:
            The lower it is, the more it preserves the edges, but also has more
            'bleeding' effects.
        """

        # internal parameters
        THR_A = smoothing
        THR_B = 0.04  # ~10/255
        NON_LIN = 0.12  # ~30/255
        LUT_RES = 256

        # get sigmoid LUTs
        lut_a = self.get_sigmoid_lut(
            resolution=LUT_RES, threshold=THR_A, non_linearirty=NON_LIN
        )
        lut_a_max = len(lut_a) - 1
        lut_b = self.get_sigmoid_lut(
            resolution=LUT_RES, threshold=THR_B, non_linearirty=NON_LIN
        )
        lut_b_max = len(lut_b) - 1

        # dealing with different number of channels
        if len(image.shape) == 3:
            if grayscale_out is True:
                image_ph_mask = rgb2gray(image.copy())  # [0,1] 2D
            else:
                image_ph_mask = img_as_float(image.copy())  # [0,1] 3D
        elif len(image.shape) == 2:
            image_ph_mask = img_as_float(image.copy())  # [0,1] 2D
        else:
            image_ph_mask = img_as_float(image.copy())  # [0,1] ?D

        # if image is 2D, expand dimensions to 3D for code compatibility
        # (filtering assumes a 3D image)
        if len(image_ph_mask.shape) == 2:
            image_ph_mask = np.expand_dims(image_ph_mask, axis=2)

        # up -> down
        for i in range(1, image_ph_mask.shape[0] - 1):
            d = np.abs(image_ph_mask[i - 1, :, :] - image_ph_mask[i + 1, :, :])  # diff
            d = lut_a[(d * lut_a_max).astype(int)]
            image_ph_mask[i, :, :] = (image_ph_mask[i, :, :] * d) + (
                image_ph_mask[i - 1, :, :] * (1 - d)
            )

        # left -> right
        for j in range(1, image_ph_mask.shape[1] - 1):
            d = np.abs(image_ph_mask[:, j - 1, :] - image_ph_mask[:, j + 1, :])  # diff
            d = lut_a[(d * lut_a_max).astype(int)]
            image_ph_mask[:, j, :] = (image_ph_mask[:, j, :] * d) + (
                image_ph_mask[:, j - 1, :] * (1 - d)
            )

        # down -> up
        for i in range(image_ph_mask.shape[0] - 2, 1, -1):
            d = np.abs(image_ph_mask[i - 1, :, :] - image_ph_mask[i + 1, :, :])  # diff
            d = lut_a[(d * lut_a_max).astype(int)]
            image_ph_mask[i, :, :] = (image_ph_mask[i, :, :] * d) + (
                image_ph_mask[i + 1, :, :] * (1 - d)
            )

        # right -> left
        for j in range(image_ph_mask.shape[1] - 2, 1, -1):
            d = np.abs(image_ph_mask[:, j - 1, :] - image_ph_mask[:, j + 1, :])  # diff
            d = lut_b[(d * lut_b_max).astype(int)]
            image_ph_mask[:, j, :] = (image_ph_mask[:, j, :] * d) + (
                image_ph_mask[:, j + 1, :] * (1 - d)
            )

        # up -> down
        for i in range(1, image_ph_mask.shape[0] - 1):
            d = np.abs(image_ph_mask[i - 1, :, :] - image_ph_mask[i + 1, :, :])  # diff
            d = lut_b[(d * lut_b_max).astype(int)]
            image_ph_mask[i, :, :] = (image_ph_mask[i, :, :] * d) + (
                image_ph_mask[i - 1, :, :] * (1 - d)
            )

        # convert back to 2D if grayscale is needed
        if grayscale_out is True:
            image_ph_mask = np.squeeze(image_ph_mask)

        return image_ph_mask

    def apply_local_contrast_enhancement(self, image, image_ph_mask, degree=1.5):
        """
        ---------------------------------------------------------------------------
                        Adjust local contrast in an image
        ---------------------------------------------------------------------------

        Increase or decrease the level of local details (local contrast) in an
        image. Details are defined as deviations from the local neighborhood
        provided by the photometric mask. Dark regions receive also a boost in
        local contrast.


        INPUTS
        ------
        image: numpy array of WxH of float [0,1]
            Input grayscale image.
        image_ph_mask: numpy array of WxH of float [0,1]
            Grayscale image whose values represent the neighborhood of the pixels
            of the input image. Usually, this image some type of edge aware
            filtering, such as bilateral filtering, robust recursive envelopes etc.
        degree: float [0,inf].
            How to change the local contrast.
            0: total attenuation of details.
            <1: attenuation of details
            1: details unchanged
            >1: increased local details

        OUTPUT
        ------
        image_out: numpy array of WxH of float [0,1]
            Output image with adjusted local contrast.

        """

        DARK_BOOST = 0.2
        THRESHOLD_DARK_TONES = 100 / 255
        detail_amplification_global = degree

        image_details = image - image_ph_mask  # image details

        # special treatment for dark regions
        detail_amplification_local = image_ph_mask / THRESHOLD_DARK_TONES
        detail_amplification_local[detail_amplification_local > 1] = 1
        detail_amplification_local = (
            (1 - detail_amplification_local) * DARK_BOOST
        ) + 1  # [1, 1.2]

        # apply all detail adjustements
        image_details = (
            image_details * detail_amplification_global * detail_amplification_local
        )

        # add details back to the local neighborhood
        image_out = image_ph_mask + image_details

        # stay within range
        image_out = np.clip(a=image_out, a_min=0, a_max=1, out=image_out)

        return image_out

    def apply_spatial_tonemapping(
        self,
        image,
        image_ph_mask,
        mid_tone=0.5,
        tonal_width=0.5,
        areas_dark=0.5,
        areas_bright=0.5,
        preserve_tones=True,
    ):
        """
        ---------------------------------------------------------------------------
        Apply spatially variable tone mapping based on the local neighborhood
        ---------------------------------------------------------------------------

        Applies different tone mapping curves in each pixel based on its surround.
        For surround, the photometric mask is used. Alternatively, other filters
        could be used, like gaussian, bilateral filter, edge-avoiding wavelets etc.
        Dark pixels are brightened, bright pixels are darkened, and pixels in the
        mid_tonedle of the tone range are minimally affected. More information
        about the technique can be found in the following papers:

        Related publications:
        Vonikakis, V., Andreadis, I., & Gasteratos, A. (2008). Fast centre-surround
        contrast modification. IET Image processing 2(1), 19-34.
        Vonikakis, V., Winkler, S. (2016). A center-surround framework for spatial
        image processing. Proc. IS&T Human Vision & Electronic Imaging.


        INPUTS
        ------
        image: numpy array of WxH of float [0,1]
            Input grayscale image with values in the interval [0,1].
        image_ph_mask: numpy array of WxH of float [0,1]
            Grayscale image whose values represent the neighborhood of the pixels
            of the input image. Usually, this image some type of edge aware
            filtering, such as bilateral filtering, robust recursive envelopes etc.
        mid_tone: float [0,1]
            The mid point between the 'dark' and 'bright' tones. This is equivalent
            to a pixel value [0,255], but in the interval [0,1].
        tonal_width: float [0,1]
            The range of pixel values that will be affected by the correction.
            Lower values will localize the enhancement only in a narrow range of
            pixel values, whereas for higher values the enhancement will extend to
            a greater range of pixel values.
        areas_dark: float [0,1]
            Degree of enhencement in the dark image areas (0 = no enhencement)
        areas_bright: float [0,1]
            Degree of enhencement in the bright image areas (0 = no enhencement)
        preserve_tones: boolean
            Whether or not to preserve well-exposed tones around the middle of the
            range.

        OUTPUT
        ------
        image_tonemapped: numpy array of WxH of float [0,1]
            Tonemapped grayscale image.

        """

        # defining parameters
        EPSILON = 1 / 256

        # adjust range and non-linear response of parameters
        mid_tone = self.map_value(
            value=mid_tone,
            range_in=(0, 1),
            range_out=(0, 1),
            invert=False,
            non_lin_convex=None,
            non_lin_concave=None,
        )

        tonal_width = self.map_value(
            value=tonal_width,
            range_in=(0, 1),
            range_out=(EPSILON, 1),
            invert=False,
            non_lin_convex=0.1,
            non_lin_concave=None,
        )

        areas_dark = self.map_value(
            value=areas_dark,
            range_in=(0, 1),
            range_out=(0, 5),
            invert=True,
            non_lin_convex=0.05,
            non_lin_concave=None,
        )

        areas_bright = self.map_value(
            value=areas_bright,
            range_in=(0, 1),
            range_out=(0, 5),
            invert=True,
            non_lin_convex=0.05,
            non_lin_concave=None,
        )

        # spatial tone-mapping

        # lower tones (below mid_tone level)
        image_lower = image.copy()
        image_lower[image_lower >= mid_tone] = 0
        alpha = (image_ph_mask**2) / tonal_width
        tone_continuation_factor = mid_tone / (mid_tone + EPSILON - image_ph_mask)
        alpha = alpha * tone_continuation_factor + areas_dark
        image_lower = (image_lower * (alpha + 1)) / (alpha + image_lower)

        # upper tones (above mid_tone level)
        image_upper = image.copy()
        image_upper[image_upper < mid_tone] = 0
        image_ph_mask_inv = 1 - image_ph_mask
        alpha = (image_ph_mask_inv**2) / tonal_width
        tone_continuation_factor = mid_tone / ((1 - mid_tone) - image_ph_mask_inv)
        alpha = alpha * tone_continuation_factor + areas_bright
        image_upper = (image_upper * alpha) / (alpha + 1 - image_upper)

        image_tonemapped = image_lower + image_upper

        if preserve_tones is True:
            preservation_degree = np.abs(0.5 - image_ph_mask) / 0.5  # 0: near 0.5
            #        preservation_degree = ((1 + 0.3) * preservation_degree) / (0.3 + preservation_degree)
            image_tonemapped = (
                preservation_degree * image_tonemapped
                + (1 - preservation_degree) * image
            )

        return image_tonemapped

    def adjust_brightness(self, image, degree=0):
        """
        ---------------------------------------------------------------------------
                    Apply global tone mapping on a grayscale image
        ---------------------------------------------------------------------------

        Applies a single tone mapping curve in all the pixels of a grayscale image.
        Depending on the parameters, the image can be brighten or darken. The set
        of curves used are similar to gamma functions, but are inspired from the
        Naka-Rushton function and exhibit symmetry and better local contrast. More
        information about the technique can be found in the following papers:

        Related publications:
        Vonikakis, V., Winkler, S. (2016). A center-surround framework for spatial
        image processing. Proc. IS&T Human Vision & Electronic Imaging.

        INPUTS
        ------
        image: numpy array of WxH of float [0,1]
            Input grayscale image with values in the interval [0,1].
        degree: float [-1,1]
            The strength of the uniform tone mapping function.
            [-1,0): darken image. Closer to -1 means more agressive darkening
                0: Unchanged tones
            (0,1]: brighten image. Closer to 1 means more agressive brightening

        OUTPUT
        ------
        image_tonemapped: numpy array of WxH of float [0,1]
            Tonemapped grayscale image.

        """

        EPSILON = 1 / 256  # what we consider minimum value

        # adjust range and non-linear response of parameters
        # unpack information: darken or brighten and the degree
        if degree > 0:
            brighten = True
        else:
            brighten = False

        degree = abs(degree)  # [0,1]

        alpha = self.map_value(
            value=degree,
            range_in=(0, 1),
            range_out=(0, 5),  # from the paper: 5x brings close to linear
            invert=True,  # from the paper
            non_lin_convex=0.05,  # adding linearity to the response
            non_lin_concave=None,
        )

        alpha = alpha + EPSILON  # to avoid division by zero

        # applying global tone-mapping
        if degree != 0:
            image_brightness = image.copy()

            if brighten is True:
                image_brightness = (image_brightness * (alpha + 1)) / (
                    alpha + image_brightness
                )
            else:
                image_brightness = (image_brightness * alpha) / (
                    alpha + 1 - image_brightness
                )
        else:
            image_brightness = image

        return image_brightness

    def transfer_graytone_to_color(self, image_color, image_graytone):

        """
        ---------------------------------------------------------------------------
                        Transfer grayscale tones to a color image
        ---------------------------------------------------------------------------

        Transfers the tones of a guide grayscale image to the color version of the
        same image, by using linear color ratios. It first brings the image from
        the sRGB color space back to the linear color space. It estimates color
        ratios of the grayscale color image with the tone-mapped grayscale guide
        image. It then applies the color ratios on the 3 color channels. Finally,
        it brings back the image to the sRGB color space (gamma corrected). Is the
        input image is in another color space (Adobe RGB), a different
        transformation could be used. However, results will not be that much
        different.

        Related publication:
        Chengho Hsin, Zong Wei Lee, Zheng Zhan Lee, and Shaw-Jyh Shin, "Color
        preservation for tone reproduction and image enhancement", Proc. SPIE 9015,
        Color Imaging XIX, 2014


        INPUTS
        ------
        image_color: numpy array of WxHx3 of uint8 [0,255]
            Input color image.
        image_graytone: numpy array of WxH of float [0,1]
            Grayscale version of the image_color which has been tonemapped and it
            will be used as a guide to transfer the same tonemapping to the color
            image.

        OUTPUT
        ------
        image_colortone: numpy array of WxHx3 of uint8 [0,255]
            Output color image with transfered tonemapping.

        """

        EPSILON = 1 / 256

        # bring both color and graytone to linear space
        image_color_linear = self.srgb_to_linear(image_color.copy())
        image_graytone_linear = self.srgb_to_linear(image_graytone.copy())
        image_gray_linear = rgb2gray(image_color_linear.copy())
        image_gray_linear[image_gray_linear == 0] = EPSILON  # for the division later

        # tone ratio of linear images: improved/original
        tone_ratio = image_graytone_linear / image_gray_linear
        #    tone_ratio[np.isinf(tone_ratio)] = 0
        #    tone_ratio[np.isnan(tone_ratio)] = 0

        # apply the tone ratios to the color image
        image_colortone_linear = image_color_linear * np.dstack([tone_ratio] * 3)

        # make sure it's within limits
        image_colortone_linear = np.clip(
            a=image_colortone_linear, a_min=0, a_max=1, out=image_colortone_linear
        )

        # bring back to gamma-corrected sRGB space for visualization
        image_colortone = self.linear_to_srgb(image_colortone_linear)

        return image_colortone

    def correct_colors(self, image):
        """
        ---------------------------------------------------------------------------
                        Correct image colors (remove color casts)
        ---------------------------------------------------------------------------

        Implements a simple color correction using the Gray World Color Assumption
        and White Point Correction.

        Related publication:
        Vonikakis, V., Arapakis, I. & Andreadis, I. (2011). Combining Gray-World
        assumption, White-Point correction and power transformation for automatic
        white balance. International Workshop on Advanced Image Technology (IWAIT),
        paper number 1569353295, Jakarta Indonesia.

        INPUTS
        ------
        image: numpy array of WxHx3 of uint8 [0,255]
            Input color image.

        OUTPUT
        ------
        image_out: numpy array of WxHx3 of float [0,1]
            Output image with adjusted colors.

        """

        image_out = img_as_float(image.copy())  # [0,1]

        #    # simple gray world color correction
        #    image_out[:,:,0] = (image_out[:,:,0] / image_out[:,:,0].mean()) * 0.5
        #    image_out[:,:,1] = (image_out[:,:,1] / image_out[:,:,1].mean()) * 0.5
        #    image_out[:,:,2] = (image_out[:,:,2] / image_out[:,:,2].mean()) * 0.5

        # mean of all channels
        image_mean = (
            image_out[:, :, 0].mean()
            + image_out[:, :, 1].mean()
            + image_out[:, :, 2].mean()
        ) / 3

        # logarithm base to which each channel will be raised
        base_r = image_out[:, :, 0].mean() / image_out[:, :, 0].max()
        base_g = image_out[:, :, 1].mean() / image_out[:, :, 1].max()
        base_b = image_out[:, :, 2].mean() / image_out[:, :, 2].max()

        # the power to which each channel will be raised
        power_r = math.log(image_mean, base_r)
        power_g = math.log(image_mean, base_g)
        power_b = math.log(image_mean, base_b)

        # separately applying different color correction powers to each channel
        image_out[:, :, 0] = (image_out[:, :, 0] / image_out[:, :, 0].max()) ** power_r
        image_out[:, :, 1] = (image_out[:, :, 1] / image_out[:, :, 1].max()) ** power_g
        image_out[:, :, 2] = (image_out[:, :, 2] / image_out[:, :, 2].max()) ** power_b

        return image_out

    def change_color_saturation(self, image_color, image_ph_mask=None, sat_degree=1.5):

        """
        ---------------------------------------------------------------------------
                        Adjust color saturation of an image
        ---------------------------------------------------------------------------

        Increase or decrease the saturation (vibrance) of colors in an image. This
        implements a simpler approach rather than using the HSV color space to
        adjust S. In my experiments HSV-based saturation adjustment was not as good
        and it exhibited some kind of 'color noise'. This approach is aesthetically
        better. The use of photometric_mask is optional, in case you would like to
        treat dark areas (where saturation is usually lower) differently.


        INPUTS
        ------
        image_color: numpy array of WxHx3 of float [0,1]
            Input color image.
        image_ph_mask: numpy array of WxH of float [0,1] or None
            Grayscale image whose values represent the neighborhood of the pixels
            of the input image. If None, saturation adjustment is applied globally
            to all pixels. If not None, then dark regions are treated differently
            and get an additional boost in saturation.

        sat_degree': float [0,inf].
            How to change the color saturation. 0: no color (grayscale),
            <1: reduced color saturation, 1: color saturation unchanged
            >1: increased color saturation

        OUTPUT
        ------
        image_new_sat: numpy array of WxHx3 of float [0,1]
            Output image with adjusted saturation.

        """

        LOCAL_BOOST = 0.2
        THRESHOLD_DARK_TONES = 100 / 255

        image_color = img_as_float(image_color)  # [0,1]

        # define gray scale
        image_gray = (
            image_color[:, :, 0] + image_color[:, :, 1] + image_color[:, :, 2]
        ) / 3
        image_gray = np.dstack([image_gray] * 3)  # grayscale with 3 channels

        image_delta = image_color - image_gray  # deviations from gray

        # defining local color amplification degree
        if image_ph_mask is not None:
            detail_amplification_local = image_ph_mask / THRESHOLD_DARK_TONES
            detail_amplification_local[detail_amplification_local > 1] = 1
            detail_amplification_local = (
                (1 - detail_amplification_local) * LOCAL_BOOST
            ) + 1  # [1, 1.2]
            detail_amplification_local = np.dstack(
                [detail_amplification_local] * 3
            )  # 3 channels
        else:
            detail_amplification_local = 1

        image_new_sat = (
            image_gray + image_delta * sat_degree * detail_amplification_local
        )

        image_new_sat = np.clip(a=image_new_sat, a_min=0, a_max=1, out=image_new_sat)

        return image_new_sat

    def enhance(self, image):

        gray = rgb2gray(image.copy())
        mask = self.get_photometric_mask(image.copy())

        # increase the local contrast of the grayscale image
        image_contrast = self.apply_local_contrast_enhancement(
            image=gray,
            image_ph_mask=mask,
            degree=self.parameters["local_contrast"],
        )

        # apply spatial tonemapping on the previous stage
        image_tonemapped = self.apply_spatial_tonemapping(
            image=image_contrast,
            image_ph_mask=mask,
            mid_tone=self.parameters["mid_tones"],
            tonal_width=self.parameters["tonal_width"],
            areas_dark=self.parameters["areas_dark"],
            areas_bright=self.parameters["areas_bright"],
            preserve_tones=self.parameters["preserve_tones"],
        )

        image_brightness = self.adjust_brightness(
            image_tonemapped, degree=self.parameters["brightness"]
        )

        # transfer the enhancement on the color image (in the linear color space)
        image_colortone = self.transfer_graytone_to_color(
            image_color=image, image_graytone=image_brightness
        )

        # apply color correction (if needed)
        if self.parameters["color_correction"] is True:
            image_colortone = self.correct_colors(image=image_colortone)

        # adjust the color saturation
        image_colortone_saturation = self.change_color_saturation(
            image_color=image_colortone,
            image_ph_mask=mask,
            sat_degree=self.parameters["saturation_degree"],
        )

        return image_colortone_saturation


if __name__ == "__main__":

    parser = ArgumentParser()
    parser.add_argument(
        "-i",
        "--image_dir",
        type=str,
        help="Path to the directory containing the image files",
    )
    parser.add_argument(
        "-o",
        "--out_dir",
        type=str,
        help="Path to the output directory, where the images will be saved",
    )

    args = parser.parse_args()

    directory = args.image_dir
    output_dir = args.out_dir
    os.makedirs(output_dir, exist_ok=True)

    parameters = {}
    parameters["local_contrast"] = 1.0  # no increase in details
    parameters["mid_tones"] = 0.2  # middle of range
    parameters["tonal_width"] = 0.3  # middle of range
    parameters["areas_dark"] = 0.2  # no change in dark areas
    parameters["areas_bright"] = 0.0  # no change in bright areas
    parameters["saturation_degree"] = 0.7  # no change in color saturation
    parameters["brightness"] = 0.2  # increase overall brightness
    parameters["preserve_tones"] = True
    parameters["color_correction"] = True
    enhancer = Enhancer(parameters)

    # List all images that are saved in a compressed format (JPEG, PNG, etc)
    compressed_images_list = list(list_images(directory))

    # List all images saved in a raw format with capitalized characters (CR3)
    raw_images_list = list(glob(os.path.join(directory, "*.CR3")))

    # List all images saved in a raw format with lowercase characters (cr3)
    raw_images_list_lower = list(glob(os.path.join(directory, "*.cr3")))

    # Sum all the image lists
    images_list = (
        set(compressed_images_list + raw_images_list + raw_images_list_lower)
    )

    for image_path in tqdm(images_list):

        # Convert raw images (CR3 files) to numpy arrays
        if image_path.lower().endswith(".cr3"):
            with rawpy.imread(image_path) as raw:
                image = raw.postprocess()
        # Read compressed images with OpenCV
        else:
            image = cv2.imread(image_path, 1)
            image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
                
        enhanced = enhancer.enhance(image)
        enhanced = np.ascontiguousarray(enhanced) * 255.0
        enhanced = enhanced.astype(np.uint8)

        # Remove spaces, "'" and "," from the filename
        image_name = image_path.split(sp)[-1].split(".")[0]
        image_name = image_name.replace(" ","_")
        image_name = image_name.replace("'","_")
        image_name = image_name.replace(",","_")
        
        new_path = os.path.join(output_dir, image_name + ".jpg")

        # Save the new image
        enhanced = cv2.cvtColor(enhanced, cv2.COLOR_RGB2BGR)
        cv2.imwrite(new_path, enhanced)

    print(f"Enhanced pictures with Skimage saved to {output_dir}")