first commit
ameraner committed Nov 4, 2020
1 parent 3f7fc43 commit 73c379b
Showing 11 changed files with 1,425 additions and 0 deletions.
179 changes: 179 additions & 0 deletions Code/dsen2cr_main.py
@@ -0,0 +1,179 @@
from __future__ import division

import argparse
import random

import keras.backend as K
import numpy as np
import tensorflow as tf
import tools.image_metrics as img_met
from dsen2cr_network import DSen2CR_model
from dsen2cr_tools import train_dsen2cr, predict_dsen2cr
from keras.optimizers import Nadam
from keras.utils import multi_gpu_model
from tools.dataIO import get_train_val_test_filelists

K.set_image_data_format('channels_first')


def run_dsen2cr(predict_file=None, resume_file=None):
    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% SETUP %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    # TODO implement external hyperparam config file
    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% Setup model %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

    model_name = 'DSen2-CR_001'  # model name for training

    # model parameters
    num_layers = 16  # B value in the paper
    feature_size = 256  # F value in the paper

    # include the SAR layers as input to the model
    include_sar_input = True

    # cloud mask parameters
    use_cloud_mask = True
    cloud_threshold = 0.2  # threshold for binarisation of the cloud mask
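    # Note: pixels whose cloud probability exceeds this threshold are presumably
    # treated as cloud-covered when weighting the cloud-aware loss terms below.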

    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% Setup data processing param %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

    # input data preprocessing parameters
    scale = 2000
    max_val_sar = 2
    clip_min = [[-25.0, -32.5],
                [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
                [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]]
    clip_max = [[0, 0],
                [10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000],
                [10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000, 10000]]
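    # Assumed layout of the clip lists: the first sub-list covers the 2 SAR channels
    # (backscatter in dB, clipped to [-25, 0] and [-32.5, 0]); the other two cover the
    # 13 optical bands (reflectance scaled by 10000, clipped to [0, 10000]).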

    shuffle_train = True  # shuffle images at training time
    data_augmentation = True  # flip and rotate images randomly for data augmentation

    random_crop = True  # crop out a part of the input image randomly
    crop_size = 128  # crop size for training images

    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% Setup training %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

    dataset_list_filepath = '../Data/datasetfilelist.csv'

    base_out_path = '/path/to/output/model_runs/'
    input_data_folder = '/path/to/dataset/parent/folder'

    # training parameters
    initial_epoch = 0  # start at this epoch number
    epochs_nr = 8  # train for this number of epochs; checkpoints are generated at the end of each epoch
    batch_size = 16  # training batch size to distribute over GPUs

    # define the metric to be optimized
    loss = img_met.carl_error
    # define metrics to monitor
    metrics = [img_met.carl_error, img_met.cloud_mean_absolute_error,
               img_met.cloud_mean_squared_error, img_met.cloud_mean_sam, img_met.cloud_mean_absolute_error_clear,
               img_met.cloud_psnr,
               img_met.cloud_root_mean_squared_error, img_met.cloud_bandwise_root_mean_squared_error,
               img_met.cloud_mean_absolute_error_covered, img_met.cloud_ssim,
               img_met.cloud_mean_sam_covered, img_met.cloud_mean_sam_clear]

    # define the learning rate
    lr = 7e-5

    # initialize the optimizer
    optimizer = Nadam(lr=lr, beta_1=0.9, beta_2=0.999, epsilon=1e-8, schedule_decay=0.004)

    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% Other setup parameters %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

    predict_data_type = 'val'  # possible options: 'val' or 'test'

    log_step_freq = 1  # frequency of logging

    n_gpus = 1  # set number of GPUs
    # multiprocessing optimization setup
    use_multi_processing = True
    max_queue_size = 2 * n_gpus
    workers = 4 * n_gpus

    batch_per_gpu = int(batch_size / n_gpus)

    input_shape = ((13, crop_size, crop_size), (2, crop_size, crop_size))
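    # (13, H, W) corresponds to the 13 Sentinel-2 bands, (2, H, W) to the two SAR
    # channels, in the channels_first layout set at the top of this file.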

    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% Initialize session %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

    # configure the TensorFlow session
    config = tf.ConfigProto()
    # don't pre-allocate memory; allocate as needed
    config.gpu_options.allow_growth = True

    # only allow a given fraction of the GPU memory to be allocated
    # config.gpu_options.per_process_gpu_memory_fraction = 0.3

    # create a session with the above options specified
    K.tensorflow_backend.set_session(tf.Session(config=config))
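    # Note: ConfigProto, Session and K.tensorflow_backend are TensorFlow 1.x /
    # standalone-Keras APIs; a hypothetical TF 2.x port would use
    # tf.config.experimental.set_memory_growth(gpu, True) instead.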

    # set random seeds for repeatability
    random_seed_general = 42
    random.seed(random_seed_general)  # random package
    np.random.seed(random_seed_general)  # numpy package
    tf.set_random_seed(random_seed_general)  # tensorflow

    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% Initialize model %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

    # single or no-gpu case
    if n_gpus <= 1:
        model, shape_n = DSen2CR_model(input_shape,
                                       batch_per_gpu=batch_per_gpu,
                                       num_layers=num_layers,
                                       feature_size=feature_size,
                                       use_cloud_mask=use_cloud_mask,
                                       include_sar_input=include_sar_input)
    else:
        # handle multiple gpus
        with tf.device('/cpu:0'):
            single_model, shape_n = DSen2CR_model(input_shape,
                                                  batch_per_gpu=batch_per_gpu,
                                                  num_layers=num_layers,
                                                  feature_size=feature_size,
                                                  use_cloud_mask=use_cloud_mask,
                                                  include_sar_input=include_sar_input)

        model = multi_gpu_model(single_model, gpus=n_gpus)

    model.compile(optimizer=optimizer, loss=loss, metrics=metrics)
    print('Model compiled successfully!')

    print("Getting file lists")
    train_filelist, val_filelist, test_filelist = get_train_val_test_filelists(dataset_list_filepath)

    print("Number of train files found: ", len(train_filelist))
    print("Number of validation files found: ", len(val_filelist))
    print("Number of test files found: ", len(test_filelist))

    # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% PREDICT %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
    if predict_file is not None:
        if predict_data_type == 'val':
            predict_filelist = val_filelist
        elif predict_data_type == 'test':
            predict_filelist = test_filelist
        else:
            raise ValueError('Prediction data type not recognized.')

        predict_dsen2cr(predict_file, model, predict_data_type, base_out_path, input_data_folder, predict_filelist,
                        batch_size, clip_min, clip_max, crop_size, input_shape, use_cloud_mask, cloud_threshold,
                        max_val_sar, scale)

    else:
        # %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% TRAIN %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

        train_dsen2cr(model, model_name, base_out_path, resume_file, train_filelist, val_filelist, lr, log_step_freq,
                      shuffle_train, data_augmentation, random_crop, batch_size, scale, clip_max, clip_min, max_val_sar,
                      use_cloud_mask, cloud_threshold, crop_size, epochs_nr, initial_epoch, input_data_folder,
                      input_shape, max_queue_size, use_multi_processing, workers)


# %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% MAIN %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

if __name__ == '__main__':
    parser = argparse.ArgumentParser(description='DSen2-CR model code')
    parser.add_argument('--predict', action='store', dest='predict_file', help='Predict from model checkpoint.')
    parser.add_argument('--resume', action='store', dest='resume_file', help='Resume training from model checkpoint.')
    args = parser.parse_args()

    run_dsen2cr(args.predict_file, args.resume_file)
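
# Example invocations (hypothetical checkpoint filename):
#   python dsen2cr_main.py                            # train a new model from scratch
#   python dsen2cr_main.py --resume checkpoint.hdf5   # resume training from a checkpoint
#   python dsen2cr_main.py --predict checkpoint.hdf5  # predict on the predict_data_type split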
70 changes: 70 additions & 0 deletions Code/dsen2cr_network.py
@@ -0,0 +1,70 @@
import keras.backend as K
import tensorflow as tf
from keras.layers import Conv2D, Concatenate, Activation, Lambda, Add
from keras.models import Model, Input

K.set_image_data_format('channels_first')


def resBlock(input_l, feature_size, kernel_size, scale=0.1):
"""Definition of Residual Block to be repeated in body of network."""
tmp = Conv2D(feature_size, kernel_size, kernel_initializer='he_uniform', padding='same')(input_l)
tmp = Activation('relu')(tmp)
tmp = Conv2D(feature_size, kernel_size, kernel_initializer='he_uniform', padding='same')(tmp)

tmp = Lambda(lambda x: x * scale)(tmp)

return Add()([input_l, tmp])
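
# The residual branch is scaled by a small constant (scale=0.1) before the addition;
# this is the residual-scaling trick popularised by EDSR, which helps stabilise the
# training of very deep residual networks.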


def DSen2CR_model(input_shape,
                  batch_per_gpu=2,
                  num_layers=32,
                  feature_size=256,
                  use_cloud_mask=True,
                  include_sar_input=True):
    """Definition of network structure."""

    global shape_n

    # define dimensions
    input_opt = Input(shape=input_shape[0])
    input_sar = Input(shape=input_shape[1])

    if include_sar_input:
        x = Concatenate(axis=1)([input_opt, input_sar])
    else:
        x = input_opt

    # treat the concatenation
    x = Conv2D(feature_size, (3, 3), kernel_initializer='he_uniform', padding='same')(x)
    x = Activation('relu')(x)

    # main body of the network as a succession of resblocks
    for i in range(num_layers):
        x = resBlock(x, feature_size, kernel_size=[3, 3])

    # one more convolution
    x = Conv2D(input_shape[0][0], (3, 3), kernel_initializer='he_uniform', padding='same')(x)

    # add the first layer (long skip connection)
    x = Add()([x, input_opt])

    if use_cloud_mask:
        # The hacky trick with global variables and lambda functions is needed to avoid
        # errors when pickle-saving the model: tensors are not picklable. This way, the
        # Lambda function has no special arguments and is "encapsulated".

        shape_n = tf.shape(input_opt)

        def concatenate_array(x):
            global shape_n
            return K.concatenate([x, K.zeros(shape=(batch_per_gpu, 1, shape_n[2], shape_n[3]))], axis=1)

        x = Concatenate(axis=1)([x, input_opt])

        x = Lambda(concatenate_array)(x)

    model = Model(inputs=[input_opt, input_sar], outputs=x)

    return model, shape_n
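
# Minimal usage sketch (hypothetical 128x128 crops, channels_first):
#   model, shape_n = DSen2CR_model(((13, 128, 128), (2, 128, 128)), batch_per_gpu=2)
#   model.summary()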