update resize function

IceClear · IceClear · commit 81de83e6faf0 · 2021-12-13T15:54:11.000+08:00
diff --git a/IL-NIQE.py b/IL-NIQE.py
@@ -12,6 +12,7 @@
 
 import time
 # import ray
+from matlab_resize import MATLABLikeResize
 
 def reorder_image(img, input_order='HWC'):
     """Reorder images to 'HWC' order.
@@ -245,7 +246,11 @@ def ilniqe(img, mu_pris_param, cov_pris_param, gaussian_window, principleVectors
     nanConst = 2000
 
     if resize:
-        img = cv2.resize(img, (normalizedWidth, normalizedWidth), interpolation=cv2.INTER_AREA)
+        # img = cv2.resize(img, (normalizedWidth, normalizedWidth), interpolation=cv2.INTER_AREA)
+        resize_func = MATLABLikeResize(output_shape=(normalizedWidth, normalizedWidth))
+        img = resize_func.resize_img(img)
+        img = np.clip(img, 0.0, 255.0)
+
     h, w, _ = img.shape
 
     num_block_h = math.floor(h / block_size_h)
diff --git a/README.md b/README.md
@@ -22,21 +22,19 @@ You can also train your own model via training.m in the Matlab version. But the
 
 |Image|IL-NIQE (using official .mat) (Matlab/Python)|IL-NIQE (using .mat trained in python) (Python)|IL-NIQE (w/o imresize) (Matlab/Python)|Time(sec) (Matlab/Python)|
 |:-|:-|:-|:-|:-|
-|pepper_0.png|29.1422 / 27.3655|28.1166|38.7078 / 38.9319|9.9567 / 103.4350|
-|pepper_1.png|36.9637 / 39.0683|38.7309|36.6869 / 37.0163|9.7487 / 90.1218|
-|pepper_2.png|29.5075 / 31.5751|29.5121|28.7137 / 28.6329|10.3733 / 103.6504|
-|pepper_3.png|78.0557 / 58.6855|49.9387|92.3750 / 92.9693|10.5093 / 97.8555|
-|pepper_4.png|46.8697 / 54.2524|41.9770|46.4926 / 46.8856|9.7452 / 103.4113|
+|pepper_0.png|29.1422 / 28.8966|30.3513|38.7078 / 38.9319|9.9567 / 103.4350|
+|pepper_1.png|36.9637 / 37.4120|37.6577|36.6869 / 37.0163|9.7487 / 90.1218|
+|pepper_2.png|29.5075 / 28.9969|28.4353|28.7137 / 28.6329|10.3733 / 103.6504|
+|pepper_3.png|78.0557 / 83.3886|74.5166|92.3750 / 92.9693|10.5093 / 97.8555|
+|pepper_4.png|46.8697 / 51.7191|46.9279|46.4926 / 46.8856|9.7452 / 103.4113|
 
 For Matlab, it uses parpool for multiprocessing and is much faster than python. This implement supports multiprocessing via ray.
 
-* Accuracy: Generally, without resizing the image, the difference is smaller than 1. I think this can be accepted since at current stage, no-reference metric cannot accurately reflect the quality of an image.
 * Difference: The main reasons of the difference may be due to the precision of float computing and different results of similar functions of Matlab and Python, i.e., imresize. (The large differences for 'pepper_3.png' and 'pepper_4.png' are mainly due to resize.)
 
 After comparision, I have found some lines which generate different results, it can be more accurate if you can provide a better function to replace the current one:
 
-- [imresize function:](https://github.com/IceClear/IL-NIQE/blob/master/IL-NIQE.py#L249) The difference between the imresize function between cv2 and Matlab seems affect the results the most. Maybe the solution is to rewrite the function in python.
+- [imresize function:](https://github.com/IceClear/IL-NIQE/blob/master/IL-NIQE.py#L249) The difference between the imresize implementations of Python and Matlab seems to affect the results the most. Maybe the solution is to rewrite the function in Python.
 - [var:](https://github.com/IceClear/IL-NIQE/blob/master/IL-NIQE.py#L111) The varience of numpy is sometimes different from the var() function in Matlab. The difference is smaller than 1. Reasons are unknoen yet.
-- [mean:](https://github.com/IceClear/IL-NIQE/blob/master/IL-NIQE.py#L110) When the number is very small (<1e-15), this function will fail due to the limit of float64. This seems not the main problem.
 
 Any suggestions for improvement are welcomed.
diff --git a/matlab_resize.py b/matlab_resize.py
@@ -0,0 +1,276 @@
+# This code is referenced from matlab_imresize with modifications
+# Reference: https://github.com/fatheral/matlab_imresize/blob/master/imresize.py  # noqa
+# Original licence: Copyright (c) 2020 fatheral, under the MIT License.
+# Modified from MMediting: https://github.com/open-mmlab/mmediting
+import numpy as np
+
+
+def get_size_from_scale(input_size, scale_factor):
+    """Compute the output size from the input size and per-axis scales.
+
+    Args:
+        input_size (tuple): Size of the input image along each axis.
+        scale_factor (Sequence[float]): One resize factor per axis; it is
+            zipped with input_size, so unmatched trailing axes are ignored.
+
+    Returns:
+        list[int]: Output size, each entry rounded up to an integer.
+    """
+    sizes = []
+    for factor, length in zip(scale_factor, input_size):
+        # round up so a fractional pixel still yields a whole pixel
+        sizes.append(int(np.ceil(factor * length)))
+
+    return sizes
+
+
+def get_scale_from_size(input_size, output_size):
+    """Compute the per-axis scale factor from input and output sizes.
+
+    Args:
+        input_size (tuple(int)): Size of the input image along each axis.
+        output_size (tuple(int)): Size of the output image along each axis.
+
+    Returns:
+        list[float]: output / input ratio for every axis present in both
+            arguments (the two are zipped, so the shorter one wins).
+    """
+    ratios = []
+    for src_len, dst_len in zip(input_size, output_size):
+        # multiply by 1.0 first to force true (float) division
+        ratios.append(1.0 * dst_len / src_len)
+
+    return ratios
+
+
+def _cubic(x):
+    """Evaluate the piecewise cubic (bicubic) interpolation kernel.
+
+    Args:
+        x (ndarray): The distance from the center position.
+
+    Returns:
+        ndarray: The weight for each distance; it is zero when |x| > 2.
+
+    """
+
+    dist = np.abs(np.array(x, dtype=np.float32))
+    dist_sq = dist**2
+    dist_cu = dist_sq * dist
+
+    # each polynomial is multiplied by a boolean mask selecting its band
+    # near lobe, |x| <= 1: 1.5|x|^3 - 2.5|x|^2 + 1
+    near = (1.5 * dist_cu - 2.5 * dist_sq + 1) * (dist <= 1)
+    # far lobe, 1 < |x| <= 2: -0.5|x|^3 + 2.5|x|^2 - 4|x| + 2
+    far_poly = -0.5 * dist_cu + 2.5 * dist_sq - 4 * dist + 2
+    far = far_poly * ((1 < dist) & (dist <= 2))
+
+    return near + far
+
+
+def get_weights_indices(input_length, output_length, scale, kernel,
+                        kernel_width):
+    """Build the interpolation weights and source indices for one axis.
+
+    Args:
+        input_length (int): Length of the input sequence.
+        output_length (int): Length of the output sequence.
+        scale (float): Scale factor.
+        kernel (func): The kernel used for resizing.
+        kernel_width (int): The width of the kernel.
+
+    Returns:
+        tuple[ndarray]: The weights and the input indices, one row per
+            output position; out-of-range indices are mirrored at borders.
+    """
+    if scale < 1:
+        # downscaling: stretch the kernel by 1/scale for antialiasing
+        def taps(x):
+            return scale * kernel(scale * x)
+
+        support = 1.0 * kernel_width / scale
+    else:
+        taps, support = kernel, kernel_width
+
+    # 1-based output coordinates mapped back to input coordinates
+    out_pos = np.arange(1, output_length + 1).astype(np.float32)
+    centers = out_pos / scale + 0.5 * (1 - 1 / scale)
+
+    # leftmost contributing pixel and the maximum number of pixels per row
+    first = np.floor(centers - support / 2)
+    num_taps = int(np.ceil(support)) + 2
+
+    # candidate input pixels for each output position
+    offsets = first[:, np.newaxis, ...] + np.arange(num_taps)
+    indices = offsets.astype(np.int32)
+
+    # kernel response at each candidate, normalised so every row sums to 1
+    weights = taps(centers[:, np.newaxis, ...] - indices - 1)
+    weights = weights / np.sum(weights, axis=1)[:, np.newaxis, ...]
+
+    # reflect indices that fall outside [0, input_length) back inside
+    mirror = np.concatenate(
+        (np.arange(input_length), np.arange(input_length - 1, -1,
+                                            step=-1))).astype(np.int32)
+    indices = mirror[np.mod(indices, mirror.size)]
+
+    # remove all-zero columns
+    keep = np.nonzero(np.any(weights, axis=0))
+    # keep is a 1-tuple, so the fancy index also inserts a length-1 axis
+    weights = weights[:, keep]
+    indices = indices[:, keep]
+
+    return weights, indices
+
+
+def resize_along_dim(img_in, weights, indices, dim):
+    """Resize along a specific dimension.
+
+    Args:
+        img_in (ndarray): The input image, expected to be 3-D (H, W, C).
+        weights (ndarray): The weights used for interpolation, computed from
+            [get_weights_indices].
+        indices (ndarray): The indices used for interpolation, computed from
+            [get_weights_indices].
+        dim (int): Which dimension to undergo interpolation (0 or 1).
+
+    Returns:
+        ndarray: Interpolated (along one dimension) image. uint8 input is
+            clipped to [0, 255], rounded and returned as uint8.
+    """
+    # remember the dtype first: the float32 cast below would otherwise make
+    # the uint8 check at the end unreachable
+    is_uint8 = img_in.dtype == np.uint8
+    img_in = img_in.astype(np.float32)
+    w_shape = weights.shape
+    output_shape = list(img_in.shape)
+    output_shape[dim] = w_shape[0]
+    img_out = np.zeros(output_shape)
+
+    if dim == 0:
+        for i in range(w_shape[0]):
+            w = weights[i, :][np.newaxis, ...]
+            img_slice = img_in[indices[i, :], :]
+            img_out[i] = np.sum(np.squeeze(img_slice, axis=0) * w.T, axis=0)
+    elif dim == 1:
+        for i in range(w_shape[0]):
+            w = weights[i, :][:, :, np.newaxis]
+            img_slice = img_in[:, indices[i, :]]
+            img_out[:, i] = np.sum(np.squeeze(img_slice, axis=1) * w.T, axis=1)
+
+    if not is_uint8:
+        return img_out
+    img_out = np.clip(img_out, 0, 255)
+    return np.around(img_out).astype(np.uint8)
+
+
+class MATLABLikeResize:
+    """Resize the input image using MATLAB-like downsampling.
+
+        Currently support bicubic interpolation only. Note that the output of
+        this function is slightly different from the official MATLAB function.
+
+        Required keys are the keys in attribute "keys". Added or modified keys
+        are "scale" and "output_shape", and the keys in attribute "keys".
+
+        Args:
+            keys (list[str] | None, optional): A list of keys whose values are
+                modified by __call__. None means no keys. Default: None.
+            scale (float | None, optional): The scale factor of the resize
+                operation. If None, it will be determined by output_shape.
+                Default: None.
+            output_shape (tuple(int) | None, optional): The size of the output
+                image. If None, it will be determined by scale. Note that if
+                scale is provided, output_shape will not be used.
+                Default: None.
+            kernel (str, optional): The kernel for the resize operation.
+                Currently support 'bicubic' only. Default: 'bicubic'.
+            kernel_width (float): The kernel width. Currently support 4.0 only.
+                Default: 4.0.
+
+        Raises:
+            ValueError: If kernel is not 'bicubic', kernel_width is not 4.0,
+                or scale and output_shape are both None.
+    """
+
+    def __init__(self,
+                 keys=None,
+                 scale=None,
+                 output_shape=None,
+                 kernel='bicubic',
+                 kernel_width=4.0):
+        if kernel.lower() != 'bicubic':
+            raise ValueError('Currently support bicubic kernel only.')
+
+        if float(kernel_width) != 4.0:
+            raise ValueError('Current support only width=4 only.')
+
+        if scale is None and output_shape is None:
+            raise ValueError('"scale" and "output_shape" cannot be both None')
+
+        self.kernel_func = _cubic
+        self.keys = keys
+        self.scale = scale
+        self.output_shape = output_shape
+        self.kernel = kernel
+        self.kernel_width = kernel_width
+
+    def resize_img(self, img):
+        """Resize a single image array and return the result."""
+        return self._resize(img)
+
+    def _resize(self, img):
+        """Resize axes 0 and 1 of img; 2-D input gains a channel axis."""
+        # compute scale and output_size
+        if self.scale is not None:
+            scale = [float(self.scale)] * 2
+            output_size = get_size_from_scale(img.shape, scale)
+        else:
+            # only the first two axes are resized, so ignore any extra entry
+            scale = get_scale_from_size(img.shape[:2], self.output_shape[:2])
+            output_size = list(self.output_shape)
+
+        output = np.copy(img)
+        if output.ndim == 2:  # grayscale image
+            output = output[:, :, np.newaxis]
+
+        # apply cubic interpolation along two dimensions, smallest scale first
+        for dim in np.argsort(np.array(scale)):
+            weight, index = get_weights_indices(img.shape[dim],
+                                                output_size[dim], scale[dim],
+                                                self.kernel_func,
+                                                self.kernel_width)
+            output = resize_along_dim(output, weight, index, dim)
+
+        return output
+
+    def __call__(self, results):
+        """Resize results[key] for every key in self.keys, in place.
+
+        A lone ndarray is resized as one image, anything else as an iterable
+        of images; "scale" and "output_shape" are also written to results.
+        """
+        # keys defaults to None; iterate over nothing instead of raising
+        for key in (() if self.keys is None else self.keys):
+            is_single_image = False
+            if isinstance(results[key], np.ndarray):
+                is_single_image = True
+                results[key] = [results[key]]
+
+            results[key] = [self._resize(img) for img in results[key]]
+
+            if is_single_image:
+                results[key] = results[key][0]
+
+        results['scale'] = self.scale
+        results['output_shape'] = self.output_shape
+
+        return results
+
+    def __repr__(self):
+        repr_str = self.__class__.__name__
+        repr_str += (
+            f'(keys={self.keys}, scale={self.scale}, '
+            f'output_shape={self.output_shape}, '
+            f'kernel={self.kernel}, kernel_width={self.kernel_width})')
+        return repr_str
diff --git a/python_templateModel.mat b/python_templateModel.mat
diff --git a/train.py b/train.py
@@ -11,6 +11,8 @@
 from scipy.stats import exponweib
 from scipy.optimize import fmin
 import time
+from matlab_resize import MATLABLikeResize
+from tqdm import tqdm
 
 def MyPCA(sampleData, reservedRatio):
     principleVectors = []
@@ -218,17 +220,20 @@ def train(data_path):
     gaussian_window = matlab_fspecial((5,5),5/6)
     gaussian_window = gaussian_window/np.sum(gaussian_window)
 
-    trainingFiles = os.listdir(data_path)
+    trainingFiles = sorted(os.listdir(data_path))
 
     pic_features = []
     pic_sharpness = []
 
-    for img_file in trainingFiles:
+    for img_file in tqdm(trainingFiles):
         img = cv2.imread(os.path.join(data_path, img_file))
         img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
         img = img.astype(np.float64)
         img = img.round()
-        img = cv2.resize(img, (normalizedWidth, normalizedWidth),interpolation=cv2.INTER_AREA)
+        # img = cv2.resize(img, (normalizedWidth, normalizedWidth),interpolation=cv2.INTER_AREA)
+        resize_func = MATLABLikeResize(output_shape=(normalizedWidth, normalizedWidth))
+        img = resize_func.resize_img(img)
+        img = np.clip(img, 0.0, 255.0)
 
         h, w, _ = img.shape
 
@@ -352,7 +357,6 @@ def train(data_path):
         distparam = np.concatenate(distparam, axis=1)
         pic_features.append(np.array(distparam))
         pic_sharpness.append(sharpness)
-        print(img_file, flush=True)
 
     prisparam = None
     for i in range(len(pic_features)):