From 730e2bf0def02ba706f9de11a44680fd8cdd1f12 Mon Sep 17 00:00:00 2001 From: linakrisztian <106728040+linakrisztian@users.noreply.github.com> Date: Wed, 14 Aug 2024 08:42:27 +0200 Subject: [PATCH 1/5] support of reading vrts beside tifs (#2) --- src/README.md | 36 ++++++++++++++++++------------------ src/cnn_lib.py | 10 ++++++++-- src/data_preparation.py | 13 ++++++++++--- src/detect.py | 5 ++++- src/utils.py | 12 +++++++++++- 5 files changed, 51 insertions(+), 25 deletions(-) diff --git a/src/README.md b/src/README.md index e248b113..cce33b9d 100644 --- a/src/README.md +++ b/src/README.md @@ -11,10 +11,10 @@ The dataset is expected to be provided in the following structure: ``` path/to/my/dataset/ ├── label_colors.txt -├── im1_image.tif -├── im1_label.tif -├── im2_image.tif -├── im2_label.tif +├── im1_image.tif/.vrt +├── im1_label.tif/.vrt +├── im2_image.tif/.vrt +├── im2_label.tif/.vrt └── ... ``` @@ -43,24 +43,24 @@ directories. ``` path/to/my/dataset/ ├── label_colors.txt -├── im1_image.tif -├── im1_label.tif -├── im2_image.tif -├── im2_label.tif +├── im1_image.tif/.vrt +├── im1_label.tif/.vrt +├── im2_image.tif/.vrt +├── im2_label.tif/.vrt ├── train_images -│ ├── image_0.tif -│ ├── image_1.tif -│ ├── image_2.tif -│ └── image_4.tif +│ ├── image_0.tif/.vrt +│ ├── image_1.tif/.vrt +│ ├── image_2.tif/.vrt +│ └── image_4.tif/.vrt ├── train_masks -│ ├── image_0.tif -│ ├── image_1.tif -│ ├── image_2.tif -│ └── image_4.tif +│ ├── image_0.tif/.vrt +│ ├── image_1.tif/.vrt +│ ├── image_2.tif/.vrt +│ └── image_4.tif/.vrt ├── val_images -│ └── image_3.tif +│ └── image_3.tif/.vrt └── val_masks - └── image_3.tif + └── image_3.tif/.vrt ``` ## Training diff --git a/src/cnn_lib.py b/src/cnn_lib.py index 66724a51..f82ba103 100644 --- a/src/cnn_lib.py +++ b/src/cnn_lib.py @@ -1214,8 +1214,14 @@ def get_tf_dataset(data_dir, batch_size=5, operation='train', # create variables useful throughout the entire class nr_samples = len(os.listdir(images_dir)) - img_filelist = list(pathlib.Path(images_dir).glob('*.tif')) - mask_filelist = list(pathlib.Path(masks_dir).glob('*.tif')) + img_filelist = sorted( + list(pathlib.Path(images_dir).glob('*.tif')) + + list(pathlib.Path(images_dir).glob('*.vrt')) + ) + mask_filelist = sorted( + list(pathlib.Path(masks_dir).glob('*.tif')) + + list(pathlib.Path(masks_dir).glob('*.vrt')) + ) image_count = len(img_filelist) mask_count = len(mask_filelist) diff --git a/src/data_preparation.py b/src/data_preparation.py index e5f8ec25..ebb40d84 100644 --- a/src/data_preparation.py +++ b/src/data_preparation.py @@ -44,9 +44,16 @@ def generate_dataset_structure(data_dir, tensor_shape=(256, 256), dir_names = train_val_determination(val_set_pct) # tile and write samples - source_images = sorted(glob.glob(os.path.join(data_dir, '*image.tif'))) - for i in source_images: - tile(i, i.replace('image.tif', 'label.tif'), tensor_shape, + source_images = sorted( + glob.glob(os.path.join(data_dir, '*image.tif')) + + glob.glob(os.path.join(data_dir, '*image.vrt')) + ) + source_label = sorted( + glob.glob(os.path.join(data_dir, '*label.tif')) + + glob.glob(os.path.join(data_dir, '*label.vrt')) + ) + for i in range(len(source_images)): + tile(source_images[i], source_label[i], tensor_shape, filter_by_class, augment, dir_names, ignore_masks) # check if there are some training data diff --git a/src/detect.py b/src/detect.py index 86c1b66d..c2e513a4 100644 --- a/src/detect.py +++ b/src/detect.py @@ -24,7 +24,10 @@ def main(data_dir, model, in_weights_path, visualization_path, batch_size, if ignore_masks 
is False: # check if labels are provided import glob - if len(glob.glob(os.path.join(data_dir, '*label.tif'))) == 0: + if len( + glob.glob(os.path.join(data_dir, '*label.tif')) + + glob.glob(os.path.join(data_dir, '*label.vrt')) + ) == 0: raise DatasetError('No labels provided in the dataset.') # get nr of bands diff --git a/src/utils.py b/src/utils.py index c9aa7f90..fb9ad534 100644 --- a/src/utils.py +++ b/src/utils.py @@ -3,6 +3,7 @@ import os import glob import argparse +import sys import tensorflow as tf @@ -24,11 +25,20 @@ def get_codings(description_file): def get_nr_of_bands(data_dir): - """Get number of bands in the first *image.tif raster in a directory. + """Get number of bands in the first *image.tif or first *.vrt raster in a directory. :param data_dir: directory with images for training or detection """ + # check for tif images = glob.glob(os.path.join(data_dir, '*image.tif')) + # if no tif found check for vrt + if not images: + images = glob.glob(os.path.join(data_dir, '*.vrt')) + # if still nothing found return error message + if not images: + sys.exit("ERROR: No *image.tif or *.vrt found on top level of training directory." + "Needed to determine number of bands of input") + dataset_image = gdal.Open(images[0], gdal.GA_ReadOnly) nr_bands = dataset_image.RasterCount dataset_image = None From 4d46d152e614d33d7532d7bd21c7ffec5f747498 Mon Sep 17 00:00:00 2001 From: linakrisztian <106728040+linakrisztian@users.noreply.github.com> Date: Wed, 14 Aug 2024 12:09:42 +0200 Subject: [PATCH 2/5] Change input/output dimension for train-finetune (#1) * implement FCN (#45) * BaseModel classifier: support turning off onehot encoding * fix typo in error message * propagate summary definitions allow changing the summary width * VGG: fix wrong kwargs in get_config * detect.py: support more TF versions for setting seed * support of changing input and output channel dimension for finetune models * remove non relvant changes from PR * cleanup and comment changes * checkout code-stand metz * fix setting model weights * fix load model weights * AW review --------- Co-authored-by: Ondrej Pesek --- src/train.py | 100 ++++++++++++++++++++++++++++++++++++++++++++++----- 1 file changed, 92 insertions(+), 8 deletions(-) diff --git a/src/train.py b/src/train.py index d2d432f8..4cc2e2f7 100644 --- a/src/train.py +++ b/src/train.py @@ -2,6 +2,7 @@ import os import argparse +import sys import numpy as np import tensorflow as tf @@ -21,6 +22,66 @@ def rescale_image(input_image, input_mask): return input_image, input_mask +def load_pretrained_model(model, id2code, + tensor_shape, loss_function, tversky_alpha, tversky_beta, + dropout_rate_input, dropout_rate_hidden, backbone, name, + in_weights_path, model_new, + finetune_old_inp_dim, finetune_old_out_dim): + # if input or output dimension changed w.r.t pretrained model + if finetune_old_inp_dim or finetune_old_out_dim: + if model == "U-Net": + # set dimensions for creating pretrained model + if finetune_old_inp_dim: + nr_bands = finetune_old_inp_dim + if finetune_old_out_dim: + num_class = finetune_old_out_dim + else: + num_class = len(id2code) + + # creating model with dimensions of pretrained model + # NOTE: do not set create_model to verbose=False + # --> need once run model.summary() -> otherwise model dimensions are not set + print("------------------------------") + print("-- Start: Dimensions of OLD Model: --") + print("------------------------------") + model_old = create_model( + model, num_class , nr_bands, tensor_shape, nr_filters=32, 
loss=loss_function, + alpha=tversky_alpha, beta=tversky_beta, + dropout_rate_input=dropout_rate_input, + dropout_rate_hidden=dropout_rate_hidden, backbone=backbone, name=name) + print("----------------------------------") + print("-- End: Dimensions of OLD Model: --") + print("----------------------------------") + # load model weights of pretrained model + model_old.load_weights(in_weights_path) + + # Set weights of new model, with weights of pretrained model + # NOTE: model.layers returns list of model layers BUT not necessarily in the correct order + # Thus have to explicitely check for first and last layer index + # Get all layer names: + layer_names = [layer.name for layer in model_new.layers] + # Get layer index of first downsampling block + chlayer_first = model_new.ds_blocks[0].name + ind_chlayer_first = layer_names.index(chlayer_first) + # Get layer index of last layer od model + chlayer_last = "classifier_layer" + ind_chlayer_last = layer_names.index(chlayer_last) + # iterate over all layers to set the weights + for ind in range(0,len(model_new.layers)): + # if input dimension changed, don't set weigts for this layer in new model + if ind == ind_chlayer_first and finetune_old_inp_dim: + continue + # if output dimension changed, don't set weigts for this layer in new model + if ind == ind_chlayer_last and finetune_old_out_dim: + continue + # set weights from pretrained model, for all remaining layers + model_new.layers[ind].set_weights(model_old.layers[ind].get_weights()) + else: + sys.exit("ERROR: Change of input or output dimensions w.r.t pretrained models only " + "supported for U-Net so far (parameter --finetune_old_inp_dim or --finetune_old_out_dim)") + else: + # if model dimension did not chainged, load weights from complete model + model_new.load_weights(in_weights_path) def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, visualization_path='/tmp', nr_epochs=1, initial_epoch=0, batch_size=1, @@ -28,8 +89,10 @@ def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, monitored_value='val_accuracy', force_dataset_generation=False, fit_memory=False, augment=False, tversky_alpha=0.5, tversky_beta=0.5, dropout_rate_input=None, dropout_rate_hidden=None, - val_set_pct=0.2, filter_by_class=None, backbone=None, name='model', - verbose=1): + val_set_pct=0.2, filter_by_class=None, backbone=None, + finetune_old_inp_dim=None, finetune_old_out_dim=None, + name='model', verbose=1, + ): if verbose > 0: utils.print_device_info() @@ -48,7 +111,7 @@ def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, tf.keras.utils.set_random_seed(seed) # tinyunet: nr_filters=32 - model = create_model( + model_new = create_model( model, len(id2code), nr_bands, tensor_shape, nr_filters=32, loss=loss_function, alpha=tversky_alpha, beta=tversky_beta, dropout_rate_input=dropout_rate_input, @@ -78,9 +141,15 @@ def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, num_parallel_calls=tf.data.AUTOTUNE) .repeat()) - # load weights if the model is supposed to do so + # load weights if the model is supposed to do so (i.e. 
fine-tune mode) if operation == 'fine-tune': - model.load_weights(in_weights_path) + load_pretrained_model( + model, id2code, + tensor_shape, loss_function, tversky_alpha, tversky_beta, + dropout_rate_input, dropout_rate_hidden, backbone, name, + in_weights_path, model_new, + finetune_old_inp_dim, finetune_old_out_dim + ) #train_generator = AugmentGenerator( # data_dir, batch_size, 'train', fit_memory=fit_memory, @@ -105,7 +174,7 @@ def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, .map(Augment()) .prefetch(buffer_size=tf.data.AUTOTUNE)) - train(model, train_generator, train_nr_samples, val_generator, val_nr_samples, id2code, batch_size, + train(model_new, train_generator, train_nr_samples, val_generator, val_nr_samples, id2code, batch_size, output_dir, visualization_path, model_fn, nr_epochs, initial_epoch, seed=seed, patience=patience, monitored_value=monitored_value, verbose=verbose) @@ -294,13 +363,27 @@ def train(model, train_generator, train_nr_samples, val_generator, val_nr_sample '--backbone', type=str, default=None, choices=('ResNet50', 'ResNet101', 'ResNet152'), help='Backbone architecture') - + parser.add_argument( + "--finetune_old_inp_dim", type=int, default=None, + help="Input dimension of pretrained model, used for finetuning. " + "Set if dimension changed in new/currently trained model." + ) + parser.add_argument( + "--finetune_old_out_dim", type=int, default=None, + help="Output dimension of pretrained model, used for finetuning. " + "Set if dimension changed in new/currently trained model." + ) args = parser.parse_args() # check required arguments by individual operations if args.operation == 'fine-tune' and args.weights_path is None: raise parser.error( 'Argument weights_path required for operation == fine-tune') + if (args.finetune_old_inp_dim or args.finetune_old_out_dim) and args.operation != "fine-tune": + raise parser.error( + "Argument operation==fine-tune required for arguments " + "finetune_old_inp_dim or finetune_old_out_dim" + ) if args.operation == 'train' and args.initial_epoch != 0: raise parser.error( 'Argument initial_epoch must be 0 for operation == train') @@ -325,4 +408,5 @@ def train(model, train_generator, train_nr_samples, val_generator, val_nr_sample args.augment_training_dataset, args.tversky_alpha, args.tversky_beta, args.dropout_rate_input, args.dropout_rate_hidden, args.validation_set_percentage, - args.filter_by_classes, args.backbone) + args.filter_by_classes, args.backbone, + args.finetune_old_inp_dim, args.finetune_old_out_dim) From 67bd6ca7ef4e873d3c85963adbefb3e9acf8f792 Mon Sep 17 00:00:00 2001 From: linakrisztian <106728040+linakrisztian@users.noreply.github.com> Date: Tue, 20 Aug 2024 14:14:43 +0200 Subject: [PATCH 3/5] add label_colors-txt filename as optional argument (#3) --- src/detect.py | 9 ++++++--- src/train.py | 9 ++++++--- 2 files changed, 12 insertions(+), 6 deletions(-) diff --git a/src/detect.py b/src/detect.py index c2e513a4..e142337c 100644 --- a/src/detect.py +++ b/src/detect.py @@ -16,7 +16,7 @@ from cnn_exceptions import DatasetError -def main(data_dir, model, in_weights_path, visualization_path, batch_size, +def main(data_dir, label_colors, model, in_weights_path, visualization_path, batch_size, seed, tensor_shape, force_dataset_generation, fit_memory, val_set_pct, filter_by_class, backbone=None, ignore_masks=False): utils.print_device_info() @@ -34,7 +34,7 @@ def main(data_dir, model, in_weights_path, visualization_path, batch_size, nr_bands = utils.get_nr_of_bands(data_dir) 
label_codes, label_names, id2code = utils.get_codings( - os.path.join(data_dir, 'label_colors.txt')) + os.path.join(data_dir, label_colors)) # set TensorFlow seed tf.random.set_seed(seed) @@ -124,6 +124,9 @@ def get_geoinfo(data_dir): parser.add_argument( '--data_dir', type=str, required=True, help='Path to the directory containing images and labels') + parser.add_argument( + "--label_colors", type=str, default="label_colors.txt", + help="Name of label colors txt file (located at top of --data-dir)") parser.add_argument( '--model', type=str, default='U-Net', choices=('U-Net', 'SegNet', 'DeepLab'), @@ -188,7 +191,7 @@ def get_geoinfo(data_dir): raise parser.error( 'Argument validation_set_percentage must be greater or equal to 0') - main(args.data_dir, args.model, args.weights_path, args.visualization_path, + main(args.data_dir, args.label_colors, args.model, args.weights_path, args.visualization_path, args.batch_size, args.seed, (args.tensor_height, args.tensor_width), args.force_dataset_generation, args.fit_dataset_in_memory, args.validation_set_percentage, args.filter_by_classes, diff --git a/src/train.py b/src/train.py index 4cc2e2f7..0640f296 100644 --- a/src/train.py +++ b/src/train.py @@ -83,7 +83,7 @@ def load_pretrained_model(model, id2code, # if model dimension did not chainged, load weights from complete model model_new.load_weights(in_weights_path) -def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, +def main(operation, data_dir, output_dir, label_colors, model, model_fn, in_weights_path=None, visualization_path='/tmp', nr_epochs=1, initial_epoch=0, batch_size=1, loss_function='dice', seed=1, patience=100, tensor_shape=(256, 256), monitored_value='val_accuracy', force_dataset_generation=False, @@ -100,7 +100,7 @@ def main(operation, data_dir, output_dir, model, model_fn, in_weights_path=None, nr_bands = utils.get_nr_of_bands(data_dir) label_codes, label_names, id2code = utils.get_codings( - os.path.join(data_dir, 'label_colors.txt')) + os.path.join(data_dir, label_colors)) # set TensorFlow seed if seed is not None: @@ -271,6 +271,9 @@ def train(model, train_generator, train_nr_samples, val_generator, val_nr_sample parser.add_argument( '--data_dir', type=str, required=True, help='Path to the directory containing images and labels') + parser.add_argument( + "--label_colors", type=str, default="label_colors.txt", + help="Name of label colors txt file (located at top of --data-dir)") parser.add_argument( '--output_dir', type=str, required=True, default=None, help='Path where logs and the model will be saved') @@ -399,7 +402,7 @@ def train(model, train_generator, train_nr_samples, val_generator, val_nr_sample 'Argument validation_set_percentage must be greater or equal to ' '0 and smaller or equal than 1') - main(args.operation, args.data_dir, args.output_dir, + main(args.operation, args.data_dir, args.label_colors, args.output_dir, args.model, args.model_fn, args.weights_path, args.visualization_path, args.nr_epochs, args.initial_epoch, args.batch_size, args.loss_function, args.seed, args.patience, From acf708534b636d3b57663ed5ca0d615d931f6fe6 Mon Sep 17 00:00:00 2001 From: linakrisztian <106728040+linakrisztian@users.noreply.github.com> Date: Fri, 23 Aug 2024 12:53:12 +0200 Subject: [PATCH 4/5] fix order of parsing arguemtns (#4) --- src/train.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/train.py b/src/train.py index 0640f296..6cb85f14 100644 --- a/src/train.py +++ b/src/train.py @@ -83,7 +83,7 @@ def 
load_pretrained_model(model, id2code, # if model dimension did not chainged, load weights from complete model model_new.load_weights(in_weights_path) -def main(operation, data_dir, output_dir, label_colors, model, model_fn, in_weights_path=None, +def main(operation, data_dir, label_colors, output_dir , model, model_fn, in_weights_path=None, visualization_path='/tmp', nr_epochs=1, initial_epoch=0, batch_size=1, loss_function='dice', seed=1, patience=100, tensor_shape=(256, 256), monitored_value='val_accuracy', force_dataset_generation=False, From a84f12ed444f54c0e9bbcd48da20cc5157decf4e Mon Sep 17 00:00:00 2001 From: Lina Krisztian Date: Fri, 20 Dec 2024 12:55:55 +0100 Subject: [PATCH 5/5] if input vrt export with tif file ending --- src/visualization.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/visualization.py b/src/visualization.py index 55517e87..476d8784 100644 --- a/src/visualization.py +++ b/src/visualization.py @@ -206,7 +206,7 @@ def visualize_detections(images, ground_truths, detections, id2code, # THE DETECTION TIF IMAGE SECTION - out = driver.Create(os.path.join(out_dir, f'{geoinfos[i][0]}'), + out = driver.Create(os.path.join(out_dir, f"{geoinfos[i][0].replace('.vrt','.tif')}"), np.shape(detections)[2], np.shape(detections)[1], 1,
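Notes on the series (illustrative sketches, not part of the committed changes).

Patch 1 repeats the same two-suffix globbing in cnn_lib.py, data_preparation.py, detect.py and utils.py. A minimal sketch of how that lookup could be centralised; the helper name `list_rasters` and its arguments are hypothetical, not code from these patches:

```python
# Hypothetical helper: collect rasters with either suffix into one sorted
# list, mirroring the *.tif/*.vrt globbing introduced in patch 1.
import pathlib

def list_rasters(directory, stem='', suffixes=('.tif', '.vrt')):
    """Return a sorted list of rasters whose names end in stem + suffix."""
    paths = []
    for suffix in suffixes:
        paths.extend(pathlib.Path(directory).glob(f'*{stem}{suffix}'))
    return sorted(paths)

# Example against the dataset layout described in src/README.md:
# images = list_rasters('path/to/my/dataset', stem='image')
# labels = list_rasters('path/to/my/dataset', stem='label')
```

Sorting both lists keeps images and labels positionally aligned, which is what the index-based pairing loop added to data_preparation.py relies on.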
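The .vrt inputs that the series now accepts can be produced from existing GeoTIFF tiles with GDAL's Python bindings; a usage sketch with placeholder file names:

```python
# Usage sketch: build a virtual raster over existing GeoTIFF tiles so it can
# be fed to training/detection like any *_image.tif. File names are
# placeholders.
from osgeo import gdal

vrt = gdal.BuildVRT('im1_image.vrt', ['tile_a.tif', 'tile_b.tif'])
vrt = None  # close the dataset so the .vrt file is flushed to disk
```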
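The core idea of patch 2 is to copy weights layer by layer from a pretrained U-Net into the new model and to skip the layers whose shapes changed: the first downsampling block when the input band count differs, and the classifier layer when the number of classes differs. A condensed sketch of that idea, assuming both Keras models enumerate corresponding layers in the same order (`old_model`, `new_model` and the skip names below are placeholders):

```python
# Condensed sketch of layer-wise weight transfer for fine-tuning with changed
# input/output dimensions. Assumes old_model and new_model expose matching
# layers in the same order via .layers.
def transfer_weights(old_model, new_model, skip_layer_names=()):
    for old_layer, new_layer in zip(old_model.layers, new_model.layers):
        if new_layer.name in skip_layer_names:
            continue  # shape changed, keep the new model's fresh weights
        new_layer.set_weights(old_layer.get_weights())

# e.g. transfer_weights(model_old, model_new,
#                       skip_layer_names=(model_new.ds_blocks[0].name,
#                                         'classifier_layer'))
```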
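Patch 4 fixes a silent parameter mix-up: main() was being called with args.label_colors and args.output_dir in an order that no longer matched the function signature. A self-contained illustration of that bug class (values are made up); keyword arguments are one way to rule it out:

```python
# Illustration only: positional arguments bind by position, so a call site
# whose order drifts from the signature assigns values to the wrong
# parameters without raising any error.
def main(operation, data_dir, label_colors, output_dir):
    return {'operation': operation, 'data_dir': data_dir,
            'label_colors': label_colors, 'output_dir': output_dir}

swapped = main('train', '/data', '/results', 'label_colors.txt')
assert swapped['label_colors'] == '/results'        # wrong binding, no error

fixed = main(operation='train', data_dir='/data',
             label_colors='label_colors.txt', output_dir='/results')
assert fixed['label_colors'] == 'label_colors.txt'  # order-independent
```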
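Patch 5 keeps a .tif ending for exported detections by rewriting a .vrt input name with str.replace. A small sketch of the same mapping done with os.path.splitext, which touches only the actual extension rather than any '.vrt' substring in the name; the helper name is hypothetical:

```python
# Sketch (hypothetical helper): map a .vrt source name to the .tif name used
# for the exported detection raster.
import os

def detection_filename(src_name):
    base, ext = os.path.splitext(src_name)
    return base + '.tif' if ext.lower() == '.vrt' else src_name

# detection_filename('im1_image.vrt') -> 'im1_image.tif'
# detection_filename('im1_image.tif') -> 'im1_image.tif'
```

For typical names the two approaches agree; they differ only if '.vrt' occurs elsewhere in the filename.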