Deblurring/preprocessing.py at master · Mat092/Deblurring · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
'''
Some function to ease preprocessing operation
'''

import os
import random

from tensorflow.keras.datasets import cifar10

from sklearn.model_selection import train_test_split as tts

import numpy as np
from matplotlib import pyplot as plt

# TODO : need to comment that for a second sorry (conflict with tensorflow-gpu in miniconda)
# import cv2
#
# def blur_input(dataset, sigma=None):
#
#   # TODO : Should do a better control on how sigma values are passed
#   if sigma is None:
#     sigma = np.random.uniform(low=0., high=3., size=len(dataset))
#
#   # If sigmaY is 0, the value from sigmaX is used. TODO : border Type?
#   # TODO : It is possible to do this with multiprocessing for speed up, but maybe not necessary.
#   y = [cv2.GaussianBlur(img, ksize=(0,0), sigmaX=s, sigmaY=0., borderType=cv2.BORDER_DEFAULT)
#        for img, s in zip(dataset, sigma) ]
#
#   return np.asarray(y, dtype='float32')


def cifar_download_and_scale():
  '''
  Download and scale the CIFAR_10 dataset from tensorflow.
  '''

  # Input image dimensions
  img_rows, img_cols, channels = 32, 32, 3
  inputs  = img_rows * img_cols * channels
  outputs = img_rows * img_cols * channels

  # The data, split between train and test sets:
  (x_train, _), (x_test, _) = cifar10.load_data()

  x_train = x_train.reshape(x_train.shape[0], img_rows, img_cols, channels)
  x_test  = x_test.reshape( x_test.shape[0] , img_rows, img_cols, channels)

  # normalize to [0., 1.] range
  x_train = x_train.astype('float32') / 255.
  x_test  = x_test.astype('float32')  / 255.

  # Concatenate, we don't need the split yet
  dataset = np.concatenate([x_train, x_test], axis=0)

  return dataset


def train_test(input, target, test_size=0.1):
  '''
  Simple wrap of train_test_split from scikit.
  '''

  x_train, x_test, y_train, y_test = tts(input, target,
                                        test_size=test_size,
                                        train_size=None,
                                        random_state=None,
                                        shuffle=True,
                                        stratify=None
                                        )

  return x_train, x_test, y_train, y_test


def transform(data):
  '''
  fourier transform of ta batch of images in dataset and blurred
  '''
  return np.fft.fftn(data, s=None, axes=(1, 2, 3), norm=None)


def anti_tranform(data):
  '''
  Compute the anti-fourier transform of a batch of images
  '''
  return np.fft.ifftn(data, s=None, axes=(1, 2, 3), norm=None)


def read_REDS(test_size=0.1):

  sharpdir = os.path.join(os.getcwd(), 'data', 'redREDS', 'sharp')
  blurdir  = os.path.join(os.getcwd(), 'data', 'redREDS', 'blur')

  # Read all files names from directories
  sharp_paths = sorted(os.listdir(sharpdir))
  blur_paths  = sorted(os.listdir(blurdir))

  test_num  = int(len(sharp_paths) * test_size)

  x_train_list = []
  y_train_list = []

  x_test_list = []
  y_test_list = []

  # Add absolute path
  for i, sharp_name in enumerate(sharp_paths):

    blur_name = sharp_name.replace('sharp', 'blur')

    blur_path  = os.path.join(blurdir,  blur_name)
    sharp_path = os.path.join(sharpdir, sharp_name)

    x_train_list.append(blur_path)
    y_train_list.append(sharp_path)

  # Create test lists and train list
  for i in range(test_num):

    # Same names selection (RANDOM)
    sharp_name = random.choice(y_train_list)
    blur_name  = sharp_name.replace('sharp', 'blur')

    # Add to test sets
    x_test_list.append(blur_name)
    y_test_list.append(sharp_name)

    # Remove from train set
    x_train_list.remove(blur_name)
    y_train_list.remove(sharp_name)

  return x_train_list, x_test_list, y_train_list, y_test_list

if __name__ == '__main__':

  # TESTING, DON'T DIVE IN, IT'S TERRIBLE.

  # Blur and save the dataset.
  datafile = os.path.join(os.getcwd(), 'data', 'cifar10.npy')
  outfile  = os.path.join(os.getcwd(), 'data', 'cifar10_blur_sigma0-3.npy')

  dataset  = np.load(datafile)

  # Blur and save
  # blurred  = blur_input(dataset)
  # np.save(outfile, blurred)

  blurred = np.load(outfile)

  img_num = 184

  plt.imshow(blurred[img_num])
  plt.imshow(dataset[img_num])

  blur  = blurred[img_num]
  sharp = dataset[img_num]

  blur  = cv2.cvtColor(blur, cv2.COLOR_BGR2RGB)
  sharp = cv2.cvtColor(sharp, cv2.COLOR_BGR2RGB)
  cv2.imwrite('images/car_sharp.png', sharp * 255)
  cv2.imwrite('images/car_blur.png', blur  * 255)

  def show_image(inpt1, inpt2):

    img_num = np.random.randint(low=0, high=len(dataset-1))

    orig = inpt1[img_num]
    blur = inpt2[img_num]

    # Small Visual Test for blurring

    fig, (ax1, ax2) = plt.subplots(nrows=1, ncols=2, figsize=(12,5))

    ax1.imshow(orig)
    ax1.set_title('Original Image')
    ax1.set_xticks([])
    ax1.set_yticks([])

    ax2.imshow(blur)
    ax2.set_title('Blurred Image')
    ax2.set_xticks([])
    ax2.set_yticks([])

    plt.show();

  # show_image(dataset, blurred)

  # Some Fourier transformation.

  outfile_ft  = os.path.join(os.getcwd(), 'data', 'cifar10_FT.npy')
  blurfile_ft = os.path.join(os.getcwd(), 'data', 'cifar10_blur_sigma0-3_FT.npy')

  ft = transform(dataset[:20000])

  ft_shift = np.log(np.abs(ft))

  # shift = np.fft.fftshift(ft)

  plt.imshow(ft_shift[0] / ft_shift[0].max())

  data = np.real(anti_tranform(ft))

  plt.imshow(data[0])

  np.abs(data - dataset[:100]).max()

  ft_blur = transform(blurred[:])

  np.save(outfile_ft,  ft_shift)
  np.save(blurfile_ft, ft_blur)

#%%