import os
# Select the PyTorch backend for Keras.
# NOTE(review): Keras is documented to read KERAS_BACKEND when it is imported,
# so this assignment is expected to stay above `import keras` - confirm before reordering.
os.environ['KERAS_BACKEND'] = 'torch'

import keras

import numpy as np
import sys

from skimage import io
from skimage.util import random_noise

import modules.MNIST
from modules.MNIST     import MNIST

import fidle

# Init Fidle environment for this notebook (id 'K3AE1').
# The call hands back the run id, the run output directory and the datasets
# directory; in the recorded run these were 'K3AE1', './run/K3AE1' and the
# project's datasets-fidle folder.
run_id, run_dir, datasets_dir = fidle.init('K3AE1')

Version              : 2.3.2
Run id               : K3AE1
Run dir              : ./run/K3AE1
Datasets dir         : /lustre/fswork/projects/rech/mlh/uja62cb/fidle-project/datasets-fidle
Start time           : 22/12/24 21:23:38
Hostname             : r3i6n0 (Linux)
Tensorflow log level : Info + Warning + Error  (=0)
Update keras cache   : False
Update torch cache   : False
Save figs            : ./run/K3AE1/figs (True)
keras                : 3.7.0
numpy                : 2.1.2
sklearn              : 1.5.2
yaml                 : 6.0.2
skimage              : 0.24.0
matplotlib           : 3.9.2
pandas               : 2.2.3
torch                : 2.5.0

# ---- Notebook parameters (default values)
#
# Output file, later given as `filename` to MNIST.save_prepared_dataset
prepared_dataset   = './data/mnist-noisy.h5'
# Forwarded as `scale` to MNIST.get_origine
# (presumably the fraction of the dataset to load, 1 = everything - confirm in modules.MNIST)
scale              = 1
# Forwarded as `verbosity` to fidle.utils.update_progress inside noise_it
progress_verbosity = 1

# Let Fidle replace the defaults above. The arguments are the *names* of the
# variables, so these names must match the assignments exactly.
# NOTE(review): the recorded run reports progress_verbosity overridden to 2;
# where the override values come from is not visible here.
fidle.override('prepared_dataset', 'scale', 'progress_verbosity')

** Overrided parameters : **
scale                : 1
progress_verbosity   : 2

# Load the original MNIST images (clean_data) and their labels (class_data)
# through the project helper. In the recorded run this gave images of shape
# (70000, 28, 28, 1) and labels of shape (70000,).
clean_data, class_data = MNIST.get_origine(scale=scale)

Dataset loaded.
Normalized.
Reshaped.
Concatenate.
x shape : (70000, 28, 28, 1)
y shape : (70000,)

def noise_it(data):
    """Return a noisy copy of `data`, processing it one image at a time.

    Each image goes through four successive `random_noise` passes, in this
    order: gaussian, salt & pepper, poisson, speckle. The input is not
    modified: the work is done on `np.copy(data)`, and every noisy image is
    written back into that copy, so the result keeps the copy's shape and
    dtype.

    Progress is reported through `fidle.utils.update_progress`, using the
    module-level `progress_verbosity`, and 'Done.' is printed at the end.

    Args:
        data: collection of images, iterated along its first axis.
            # assumes float images already normalized for skimage - TODO confirm

    Returns:
        The noisy copy of `data`.
    """
    # Noise pipeline: (mode, keyword arguments), applied top to bottom.
    noise_stages = (
        ('gaussian', {'mean': 0, 'var': 0.3}),
        ('s&p',      {'amount': 0.2, 'salt_vs_pepper': 0.5}),
        ('poisson',  {}),
        ('speckle',  {'mean': 0, 'var': 0.1}),
    )

    noisy = np.copy(data)
    total = len(data)

    for index, picture in enumerate(noisy):
        fidle.utils.update_progress('Add noise : ', index + 1, total, verbosity=progress_verbosity)
        # Chain the stages: each one receives the output of the previous one.
        for noise_mode, noise_options in noise_stages:
            picture = random_noise(picture, mode=noise_mode, **noise_options)
        noisy[index] = picture

    print('Done.')
    return noisy

# ---- Add noise to the clean images : clean_data -> noisy_data
#      (noise_it works on a copy, clean_data is kept as the target)
noisy_data = noise_it(clean_data)

Add noise :      [########################################] 100.0% of 70000
Done.

# Report the shape of both datasets (they are expected to match)
print('Clean dataset (clean_data) : ',clean_data.shape)
print('Noisy dataset (noisy_data) : ',noisy_data.shape)

# Show the first five noisy images, then the same five clean images,
# each row being saved under the name given by `save_as`.
fidle.utils.subtitle("Noisy images we'll have in input (or x)")
fidle.scrawler.images(noisy_data[:5], None, indices='all', columns=5, x_size=3,y_size=3, interpolation=None, save_as='01-noisy')
fidle.utils.subtitle('Clean images we want to obtain (or y)')
fidle.scrawler.images(clean_data[:5], None, indices='all', columns=5, x_size=3,y_size=3, interpolation=None, save_as='02-original')

Clean dataset (clean_data) :  (70000, 28, 28, 1)
Noisy dataset (noisy_data) :  (70000, 28, 28, 1)

# Draw a single random permutation of the sample indices and apply it to the
# three arrays, so that each clean image stays aligned with its noisy version
# and its class.
# NOTE(review): no seed is set in this cell, so the order presumably differs
# from one run to the next unless a seed is set elsewhere - confirm.
p = np.random.permutation(len(clean_data))
clean_data, noisy_data, class_data = clean_data[p], noisy_data[p], class_data[p]
print('Shuffled.')

Shuffled.

# Save the shuffled clean images, noisy images and classes to the file named
# by `prepared_dataset`, through the project helper.
MNIST.save_prepared_dataset( clean_data, noisy_data, class_data, filename=prepared_dataset )

Saved.
clean_data shape is :  (70000, 28, 28, 1)
noisy_data shape is :  (70000, 28, 28, 1)
class_data shape is :  (70000,)

# Close the Fidle run opened with fidle.init
# (presumably prints the end-of-run summary - confirm in the fidle package)
fidle.end()

[K3AE1] - Prepare a noisy MNIST dataset

Objectives:

What we're going to do:

Step 1 - Init and set parameters

1.1 - Init python

1.2 - Parameters

Step 2 - Get original dataset

Step 3 - Add noise

Step 4 - Have a look

Step 5 - Shuffle dataset

Step 6 - Save our prepared dataset