# visualisation_ourdata.py
# Credit to SSLTransformerRS GitHub repo
import csv
import json
import os
import time

import numpy as np
import rasterio
import torch
import torch.nn.functional as F
from PyQt5.QtCore import QThread, pyqtSignal

from dfc_dataset_sandbox import DFCDataset  # use sandbox version
from Transformer_SSL.models import build_model
from Transformer_SSL.models.swin_transformer import *  # refine to the classes actually required
from utils import dotdictify

class SegmentationThread(QThread):
    """Worker thread that segments a list of Sentinel-2 patches with a Swin model."""

    errorSignal = pyqtSignal(str)
    finishedSignal = pyqtSignal(str)
    progressSignal = pyqtSignal(int)
    resetProgressSignal = pyqtSignal()
    updatePieChartSignal = pyqtSignal(object)

    def __init__(self, model_file_path, patch_names):
        super().__init__()
        print("Patch Names:", patch_names)
        print("Model File Path:", model_file_path)
        # Fall back to the bundled checkpoint if no path was picked in the GUI
        self.model_file_path = model_file_path or "swin-t-pixel-classification-final-epoch-200.pth"
        self.patch_names = patch_names
        self.is_stopped = False
        self.is_paused = False
    def run(self):
        try:
            print(self.patch_names)
            device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

            with open("configs/backbone_config.json", "r") as fp:  # this config file must ship with the app
                swin_conf = dotdictify(json.load(fp))
            s1_backbone = build_model(swin_conf.model_config)

            # The Sentinel-2 backbone takes all 13 bands
            swin_conf.model_config.MODEL.SWIN.IN_CHANS = 13
            s2_backbone = build_model(swin_conf.model_config)
            # Data configuration:
            data_config = {
                'train_dir': 'splits/',  # path to the training directory ("ROIs0000_validation" as currently configured)
                'val_dir': 'splits/',  # path to the validation directory ("ROIs0000_test" as currently configured)
                'train_mode': 'validation',  # one of: 'test', 'validation'
                'val_mode': 'test',  # one of: 'test', 'validation'
                'num_classes': 8,  # number of classes in the dataset
                'clip_sample_values': True,  # clip (limit) sample values
                'train_used_data_fraction': 1,  # fraction of data to use, in the range [0, 1]
                'val_used_data_fraction': 1,
                'image_px_size': 224,  # image size (224x224)
                'cover_all_parts_train': True,  # if image_px_size is not 224 during training, use a random crop of the image
                'cover_all_parts_validation': True,  # if image_px_size is not 224 during validation, use a non-overlapping sliding window to cover the entire image
                'seed': 42,
            }
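            # Only the val_* keys, num_classes, image_px_size, clip_sample_values
            # and seed are consumed below; the train_* keys are unused in this thread.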
            # Only needed by the commented-out visualisation call at the end of run()
            val_dataset = DFCDataset(
                data_config['val_dir'],
                mode=data_config['val_mode'],
                clip_sample_values=data_config['clip_sample_values'],
                used_data_fraction=data_config['val_used_data_fraction'],
                image_px_size=data_config['image_px_size'],
                cover_all_parts=data_config['cover_all_parts_validation'],
                seed=data_config['seed'],
            )

            # Create a new model instance and load the segmentation checkpoint picked in the GUI
            model = DoubleSwinTransformerSegmentationS2(s2_backbone, out_dim=data_config['num_classes'], device=device)
            model.load_state_dict(torch.load(self.model_file_path, map_location='cpu'))
            model.to(device)
            model.eval()  # evaluation mode for inference

            # Input folder for the complete data set (i.e., the entire state).
            # To process every patch found there instead of the GUI selection:
            # self.patch_names = [f for f in os.listdir(input_folder) if f.endswith('.tif')]
            input_folder = "input"
            all_output_arrays = []
            for index, patch_name in enumerate(self.patch_names):
                print("Patch name: " + patch_name)
                progress_percentage = int((index + 1) / len(self.patch_names) * 100)
                self.progressSignal.emit(progress_percentage)
                patch_file = os.path.join(input_folder, patch_name)

                # Adapted from dfc_sen12ms_dataset
                with rasterio.open(patch_file) as patch:
                    patch_data = patch.read()
                    bounds = patch.bounds
                mpc_tensor = torch.from_numpy(patch_data.astype('float32'))  # input tensor of float32 values

                # Normalise the patch band by band - credit dfc_dataset.py
                s2_maxs = []
                for b_idx in range(mpc_tensor.shape[0]):
                    s2_maxs.append(
                        torch.ones((mpc_tensor.shape[-2], mpc_tensor.shape[-1])) * mpc_tensor[b_idx].max().item() + 1e-5
                    )
                s2_maxs = torch.stack(s2_maxs)
                mpc_tensor = mpc_tensor / s2_maxs
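                # Equivalent vectorised form of the loop above (a sketch, not from
                # the original source): per-band max plus epsilon, broadcast over H and W.
                #   s2_maxs = mpc_tensor.amax(dim=(-2, -1), keepdim=True) + 1e-5
                #   mpc_tensor = mpc_tensor / s2_maxs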
                mpc_tensor = torch.unsqueeze(mpc_tensor, 0)  # add batch dimension at the first position
                print(mpc_tensor.shape)  # now [1, 13, 224, 224] as desired
                # Control logic for the GUI stop/pause buttons
                if self.is_stopped:
                    print("Stop flag detected. Select the patches to start the segmentation again.")
                    self.resetProgressSignal.emit()
                    return
                if self.is_paused:
                    print("Segmentation is paused.")
                    while self.is_paused:
                        time.sleep(1)
                # Pad edge patches up to 224x224. F.pad takes pads for the last
                # dimensions first: (width_left, width_right, height_top, height_bottom).
                if mpc_tensor.shape != (1, 13, 224, 224):
                    x_l = 224 - mpc_tensor.size(dim=2)  # rows missing from the height
                    y_l = 224 - mpc_tensor.size(dim=3)  # columns missing from the width
                    # Probe the four corner pixels to work out which edges are short
                    a = True
                    try:
                        mpc_tensor[0, 1, 0, 223]
                    except IndexError:
                        a = False
                    b = True
                    try:
                        mpc_tensor[0, 1, 223, 223]
                    except IndexError:
                        b = False
                    c = True
                    try:
                        mpc_tensor[0, 1, 0, 0]
                    except IndexError:
                        c = False
                    d = True
                    try:
                        mpc_tensor[0, 1, 223, 0]
                    except IndexError:
                        d = False
                    if a and b:  # (1, 224) and (224, 224) exist [bottom edge]
                        mpc_tensor = F.pad(mpc_tensor, (y_l, 0, 0, 0), "constant", 0)  # prepend difference to y
                    elif c and d:  # (1, 1) and (224, 1) exist [top edge]
                        mpc_tensor = F.pad(mpc_tensor, (0, y_l, 0, 0), "constant", 0)  # append difference to y
                    elif b and d:  # (224, 224) and (224, 1) exist [right edge]
                        mpc_tensor = F.pad(mpc_tensor, (0, 0, x_l, 0), "constant", 0)  # prepend difference to x
                    elif c and a:  # (1, 1) and (1, 224) exist [left edge]
                        mpc_tensor = F.pad(mpc_tensor, (0, 0, 0, x_l), "constant", 0)  # append difference to x
                    else:
                        if a:  # (1, 224) exists
                            mpc_tensor = F.pad(mpc_tensor, (y_l, 0, 0, x_l), "constant", 0)  # append difference to x, prepend difference to y
                        elif b:  # (224, 224) exists
                            mpc_tensor = F.pad(mpc_tensor, (y_l, 0, x_l, 0), "constant", 0)  # prepend difference to x, prepend difference to y
                        elif d:  # (224, 1) exists
                            mpc_tensor = F.pad(mpc_tensor, (0, y_l, x_l, 0), "constant", 0)  # prepend difference to x, append difference to y
                        elif c:  # (1, 1) exists
                            mpc_tensor = F.pad(mpc_tensor, (0, y_l, 0, x_l), "constant", 0)  # append difference to x, append difference to y
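                # Worked example of the padding above (illustrative, not from a real
                # patch): a sliver read as [1, 13, 224, 100] has corners c and d but
                # not a or b, so the 'c and d' branch appends y_l = 124 zero columns
                # on the right, restoring [1, 13, 224, 224].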
                patch_img = {"s2": mpc_tensor}  # dictionary in the same format as DFC samples

                # Run inference; 'output' holds the per-pixel class scores
                with torch.no_grad():
                    output = model(patch_img)
                prediction = torch.max(output, dim=1)  # named tuple of (values, indices)
                output_arrays = prediction.indices.squeeze()  # [224, 224] map of class indices
                all_output_arrays.append(output_arrays.cpu().numpy())
                # CSV OUTPUT
                # Get the spatial information from the GeoTIFF file
                with rasterio.open(patch_file) as current_patch:
                    metadata = current_patch.meta
                    transform = current_patch.transform

                # Create the "output" folder if it doesn't exist
                output_folder = "output"
                os.makedirs(output_folder, exist_ok=True)

                # Use the patch filename (without extension) to label the outputs
                data_info = os.path.splitext(patch_name)[0]
                csv_filename = os.path.join(output_folder, f"output_data_{data_info}.csv")

                # Write one row per pixel: coordinates in the patch CRS plus the predicted class
                with open(csv_filename, mode='w', newline='') as csv_file:
                    csv_writer = csv.writer(csv_file)
                    # transform * (col, row) yields (x, y), i.e. longitude before latitude
                    csv_writer.writerow(["Longitude", "Latitude", "Class"])
                    for row_index, row in enumerate(output_arrays):
                        for col_index, class_value in enumerate(row):
                            # Geographic coordinates of the pixel's upper-left corner
                            pixel_coordinates = transform * (col_index, row_index)
                            # Convert the tensor element to a Python scalar
                            class_value_scalar = class_value.item()
                            csv_writer.writerow([pixel_coordinates[0], pixel_coordinates[1], class_value_scalar])
                print(f"CSV file '{csv_filename}' created.")
                # ADD BAND TO GEOTIFF WITH SEGMENTATION CLASSES
                # Create a new GeoTIFF with an additional band for the segmentation classes.
                # We could overwrite the old patch here, or delete it afterwards to save space.
                output_tif_filename = os.path.join(output_folder, f"output_patch_{patch_name}")
                # Use the input patch as the starting point for the output patch
                with rasterio.open(patch_file) as input_patch:
                    output_meta = input_patch.meta
                    output_meta['count'] += 1  # one extra band for the class map
                    with rasterio.open(output_tif_filename, 'w', **output_meta) as output_patch:
                        # Copy the existing bands to the new GeoTIFF
                        for i in range(1, input_patch.count + 1):
                            output_patch.write(input_patch.read(i), i)
                        # Write the class map as the last band; rasterio expects a NumPy
                        # array matching the file's dtype, not a torch tensor
                        class_band = output_arrays.cpu().numpy().astype(output_meta['dtype'])
                        output_patch.write(class_band, input_patch.count + 1)
                print(f"GeoTIFF file '{output_tif_filename}' created.")
            # Save all predictions and update the GUI pie chart
            npy_output_folder = "npy_outputs"
            os.makedirs(npy_output_folder, exist_ok=True)
            self.updatePieChartSignal.emit(all_output_arrays)
            combined_npy_filename = os.path.join(npy_output_folder, "all_output_arrays.npy")
            np.save(combined_npy_filename, all_output_arrays)
            print(f"All arrays saved to '{combined_npy_filename}'.")
            # VISUALISATION CODE
            # val_dataset.test_visual_mpc(mpc_tensor, output_arrays)
            self.finishedSignal.emit("Segmentation Finished!")
        except Exception as e:
            self.errorSignal.emit(str(e))
    def pause(self):
        print("Setting pause flag.")
        self.is_paused = True

    def resume(self):
        print("Clearing pause flag.")
        self.is_paused = False

    def stop(self):
        print("Setting stop flag.")
        self.is_paused = False
        self.is_stopped = True
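

if __name__ == "__main__":
    # Illustrative usage sketch, not part of the original module: it exercises the
    # worker headless by wiring its signals to print. The patch name below is a
    # placeholder, and passing None as the checkpoint path falls back to the
    # default defined in __init__.
    import sys
    from PyQt5.QtCore import QCoreApplication

    app = QCoreApplication(sys.argv)
    worker = SegmentationThread(None, ["example_patch.tif"])
    worker.progressSignal.connect(lambda p: print(f"Progress: {p}%"))
    worker.errorSignal.connect(lambda msg: print(f"Error: {msg}"))
    worker.finishedSignal.connect(print)
    worker.finished.connect(app.quit)  # QThread's built-in finished signal
    worker.start()
    sys.exit(app.exec_())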