CoastlineExtraction/ndwi_labels.py at master · LJitendra05/CoastlineExtraction · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
# import libraries
import rasterio as rio
from rasterio import mask
from rasterio.plot import show
from rasterio.mask import mask
from rasterio.io import MemoryFile
import shapely
from shapely.geometry import Polygon, shape ,box
import geopandas as gpd
import os
from matplotlib import pyplot as plt
import numpy as np
import cv2

# Add import for config loading
from load_config import load_config, get_image_path, get_shapefile_path

# Add import for check_crs
from utils.check_crs import check_crs, crs_match

# Add import for spatial analysis
from utils.spatial_analysis import log_spatial_info

# Add import for shapefile generation
from utils.shapefile_generator import coastline_shp_from_raster, save_and_process, save_concatenated_ndwi_with_shapefile


# Gaussian blur parameters
KSIZE_BLUR = (9, 9)  # Kernel size (must be positive and odd)
SIGMA_X = 6      # Standard deviation in X direction
SIGMA_Y = 6      # Standard deviation in Y direction

MAJORITY_THRESHOLD = 0.55


def get_ndwi_label(image_path, points_path, ksize=100, blurring=True):
    """
    This function performs NDWI calculation and classification with optional Gaussian blurring.

    Steps:
    1. Read green and NIR bands to calculate NDWI.
    2. Apply Gaussian blurring if required.
    3. Match points CRS with raster.
    4. Create a buffer around each point (number of buffers depends on the number of points in the shapefile).
    5. Mask the NDWI image with the specified buffer (sliding window).
        5.1 out_image: same shape as the original image with the specified buffer.
        5.2 out_image_clipped: clipped to the buffer.
            If the entire buffer is inside the NDWI image, its shape should be (201, 201).
            If all or part of the sliding window is outside the NDWI image, the shape will be smaller.
    6. Skip sliding windows that are not entirely inside the NDWI image.
    7. Calculate threshold based on the clipped image.
    8. Apply OR operations between `out_image` to form the final labeled image.
    9. Note that the NDWI threshold value may be less than 128.
       Therefore, it is crucial to substitute no data with -1.
    10. Apply majority rule on the number of windows to segment pixels as water.
    11. Concatenate the remaining sliding window images (unlabeled parts) from NDWI classified.
    """


    # Check CRS of input files
    check_crs(image_path, verbose=True)
    check_crs(points_path, verbose=True)


    # Establish the NDWI calculation and copy metadata
    with rio.open(image_path, driver='GTiff') as src_raster:
        green = src_raster.read(2).astype(np.float32)  # Get the green band
        nir_num = src_raster.count  # Adjusting NIR band to 4 or 5 band images
        nir = src_raster.read(nir_num).astype(np.float32)  # Get NIR band

        np.seterr(divide='ignore', invalid='ignore')

        ndwi = (green - nir) / (green + nir)  # NDWI equation
        ndwi[np.isnan(ndwi)] = 0  # Sets any NaN values in the NDWI array to 0. (Dividing by zero => NaN pixels)
        ndwi_profile = src_raster.profile  # Copies the image profile (metadata).

        # Apply Gaussian blur
        if blurring:
            print("Gaussian Filtering Applied")
            ndwi = cv2.GaussianBlur(ndwi, KSIZE_BLUR, SIGMA_X, SIGMA_Y)

        # Blank label layer
        label = np.zeros((src_raster.height, src_raster.width)).astype(np.uint8)
        # Buffer matrix: each element represents the number of times a sliding window moves over a specific pixel.
        buffer_numbers = np.zeros((src_raster.height, src_raster.width)).astype(np.uint8)
        # Water count matrix: each pixel value represents the number of times pixels are labelled as water.
        water_count = np.zeros((src_raster.height, src_raster.width)).astype(np.uint8)
        src_CRS = src_raster.crs

        # Getting pixel size for correct calculation of buffer.
        # This value expresses spatial resolution.
        pixel_size = abs(src_raster.transform[0])

        # Fix: retrieve bounds while raster file is open
        raster_bounds = src_raster.bounds

    # Preparing points for creating label masks
    points_shp = gpd.read_file(points_path)
    points_geom = points_shp.geometry
    points_geom = points_geom.set_crs(epsg=4326)  # Set CRS to WGS84
    points_geom = points_geom.to_crs(src_CRS)  # Convert CRS to match the raster

    # Before saving the file
    output_dir = "result_ndwi_labels"
    os.makedirs(output_dir, exist_ok=True)  # This will create the directory if it doesn't exist

    # Define the path for saving the reprojected vector (shapefile) after CRS alignment
    reprojected_points_path = os.path.join(output_dir, "reprojected_points.shp")
    # Save the reprojected point geometries into a new shapefile
    gpd.GeoDataFrame(geometry=points_geom).to_file(reprojected_points_path)

    # Use crs_match to check CRS of the raster and the reprojected vector file
    # IMPORTANT: Pass the path to the reprojected file, NOT the original file, to crs_match.
    if not crs_match(image_path, reprojected_points_path):
        raise ValueError("CRS mismatch after conversion! Check your input files and CRS conversion steps.")


    # Log spatial info once, outside the main loop
    log_spatial_info(raster_bounds, points_geom)

    otsu_thresholds_clipped = []  # Creating a holder for Otsu's threshold values for clipped images
    skipped = 0  # Counter for skipped windows (less than 201*201)

    # Processing each point found
    for multipoint in points_geom:
        for point in multipoint.geoms:
            # Create a buffer around the point
            buffer = point.buffer(ksize * pixel_size, cap_style=3)
            buffer_series = gpd.GeoSeries(buffer)

            # Writing NDWI to an in-memory dataset to use for masking
            ndwi_profile.update(count=1, nodata=0, dtype=rio.float32)
            with MemoryFile() as memfile:
                with memfile.open(**ndwi_profile) as mem_data:
                    mem_data.write_band(1, ndwi)
                with memfile.open() as dataset:

                    # Get raster bounds as a shapely geometry
                    raster_bounds_geom = box(*dataset.bounds)

                    # Check if the point's buffer intersects with the raster's bounds before masking - Added intersection()
                    if buffer.intersects(raster_bounds_geom):
                        out_image, out_transform = mask(dataset, shapes=[buffer], nodata=-1, crop=False)
                        out_image = out_image[0]
                        out_image = (out_image * 127) + 128
                        out_image = out_image.astype(np.uint8)

                        out_image_clipped, out_transform_clipped = mask(dataset, shapes=[buffer], nodata=-1, crop=True)
                        out_image_clipped = out_image_clipped[0]
                        out_image_clipped = (out_image_clipped * 127) + 128
                        out_image_clipped = out_image_clipped.astype(np.uint8)

                        # Mask array: mask pixels within the sliding window with 1, else 0
                        mask_array = np.copy(out_image)
                        mask_value = 1
                        mask_array = np.where(mask_array == mask_value, 0, 1)

                        # Skip buffering windows that are partly or wholly out of the NDWI image
                        if out_image_clipped.shape[0] < 200 or out_image_clipped.shape[1] < 200:
                            skipped += 1
                            continue

                        else:
                            # Calculate Otsu's threshold based on the clipped image
                            threshold_clipped, image_result_clipped = cv2.threshold(out_image_clipped, 0, 1, cv2.THRESH_BINARY + cv2.THRESH_OTSU)
                            otsu_thresholds_clipped.append(threshold_clipped)
                            threshold_window = np.where(out_image >= threshold_clipped, 1, 0).astype(np.uint8)
                            label = label | threshold_window.astype(np.uint8)  # Labelled image with sliding windows

                            water_count = water_count + threshold_window
                            buffer_numbers = buffer_numbers + mask_array

                    else:
                        # If the buffer does not intersect, skip to the next point
                        skipped += 1
                        continue


    # Labelled images based on majority sliding windows
    label_majority = np.where(water_count > (buffer_numbers * MAJORITY_THRESHOLD), 1, 0)

    # Labelled image based on mean threshold (one threshold)
    mean_threshold = np.mean(otsu_thresholds_clipped) + 10
    ndwi_8bit = ((ndwi * 127) + 128).astype(np.uint8)
    ndwi_classified = np.where(ndwi_8bit >= mean_threshold, 1, 0)

    # Concatenate the remaining sliding window images (unlabeled parts) from NDWI classified.
    sliding_windows = np.where(buffer_numbers > 0, 1, 0)
    ndwi_concatenated = np.where(sliding_windows == 1, label, ndwi_classified)

    print(f"Green min: {green.min():.2f}, Green max: {green.max():.2f}")
    print(f"NIR min: {nir.min():.2f}, NIR max: {nir.max():.2f}")
    print(f"NDWI min: {ndwi.min():.2f}, NDWI max: {ndwi.max():.2f}")  # From -1 to +1

    print(f"Total number of valid thresholds: {len(otsu_thresholds_clipped)}")
    print(f"Number of skipped windows: {skipped}")

    print(f"Actual thresholds (8-bit unsigned): {otsu_thresholds_clipped}")
    print(f"Average threshold value (8-bit unsigned): {np.mean(otsu_thresholds_clipped)}")
    print(f"Average threshold value (-1 to 1 NDWI range): {(np.mean(otsu_thresholds_clipped) - 128) / 127}")

    print(f"Label min: {np.nanmin(label)} , max: {np.nanmax(label)}")


    # Save concatenated NDWI as TIFF and generate shapefile
    save_concatenated_ndwi_with_shapefile(ndwi_concatenated, ndwi_profile, image_path)


    save_ndwi_plots(ndwi, ndwi_classified, label, label_majority, ndwi_concatenated)


def save_ndwi_plots(ndwi, ndwi_classified, label, label_majority, ndwi_concatenated, out_dir="result_ndwi_labels"):
    """
    Saves and visualizes the results of NDWI classification and labeling.

    This function generates and saves plots for different NDWI-based classification outputs:
      - The raw NDWI image.
      - The NDWI image classified using a mean threshold.
      - The NDWI image labeled using a sliding window approach.
      - The NDWI image labeled using a majority rule on sliding windows.
      - A concatenated image combining sliding window and mean threshold results.
    All plots are saved as PNG files in the specified output directory.

    Args:
        ndwi: The computed NDWI image (2D numpy array).
        ndwi_classified: Binary NDWI image classified by mean threshold (2D numpy array).
        label: Binary NDWI image labeled by sliding window (2D numpy array).
        label_majority: Binary NDWI image labeled by majority rule (2D numpy array).
        ndwi_concatenated: Combined NDWI classification result (2D numpy array).
        out_dir: Directory to save the output plots (default: 'result_ndwi_labels').
    """
    os.makedirs(out_dir, exist_ok=True)

    plt.imshow(ndwi)
    plt.title("NDWI Image")
    plt.axis("off")
    plt.savefig(os.path.join(out_dir, "ndwi_image.png"))
    plt.close()

    fig, axs = plt.subplots(2, 2, figsize=(18, 14))

    axs[0, 0].imshow(ndwi_classified)
    axs[0, 0].set_title('NDWI Classified with mean threshold')
    axs[0, 0].axis('off')

    # Plot labelled image (based on sliding windows)
    axs[0, 1].imshow(label)
    axs[0, 1].set_title('NDWI Classified with sliding window')
    axs[0, 1].axis('off')

    # Plot labelled image (based on majority sliding windows)
    axs[1, 0].imshow(label_majority)
    axs[1, 0].set_title('NDWI Classified with majority sliding window')
    axs[1, 0].axis('off')

    # Plot NDWI classified concatenated between majority sliding windows with one mean threshold
    axs[1, 1].imshow(ndwi_concatenated)
    axs[1, 1].set_title('NDWI Concatenated')
    axs[1, 1].axis('off')

    # Save NDWI concatenated as a separate PNG
    plt.figure(figsize=(10, 8))
    plt.imshow(ndwi_concatenated)
    plt.axis('off')
    plt.savefig(os.path.join(out_dir, "ndwi_concatenated.png"), bbox_inches='tight', pad_inches=0)
    plt.close()

    plt.tight_layout()
    fig.savefig(os.path.join(out_dir, "ndwi_outputs_summary.png"))
    plt.close()


boundary = {'type': 'Polygon',
            'coordinates': [[[-162.8235626220703, 66.05622435812153],
                             [-162.674560546875, 66.05622435812153],
                             [-162.674560546875, 66.10883816429516],
                             [-162.8235626220703, 66.10883816429516],
                             [-162.8235626220703, 66.05622435812153]]]}


"""
To run this script:
Change the index number (the second argument in get_image_path and get_shapefile_path)
according to the file you want to process, as specified in your config_template.json.
"""
config = load_config()
image_path = get_image_path(config, 0)  # 268898_0369619_2016-10-15_0e14_BGRN_SR_clip.tif
points_path = get_shapefile_path(config, 0)  # Deering_transect_points_2016_fw.shp

get_ndwi_label(image_path, points_path)