# Importing the required libraries

import rasterio  # For reading and working with raster data
import numpy as np  # For numerical operations, including NDVI calculation
import seaborn as sns #For generating graphs
import matplotlib.pyplot as plt  # For displaying images
import seaborn as sns  # For enhanced visualization (optional)
import geopandas as gpd  # For working with shapefiles
import pandas as pd #For CSV file edit
import rasterio.features #For feature extraction
from rasterio.plot import show  # For displaying raster data easily
from shapely.geometry import box  # For creating bounding box for clipping
from shapely.ops import unary_union #For shapefile adjustment
from shapely.geometry import Polygon #For adjustment of polygons
from rasterio.mask import mask  # For masking and cropping rasters with shapefiles
from mpl_toolkits.axes_grid1 import make_axes_locatable #For adjusting colorbar size

# File path to the Red band raster
red_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_red.tif"

# Open the Red band using rasterio
with rasterio.open(red_band_path) as red_band:
    red_band_data = red_band.read(1)  # Read the first (and only) band
    red_band_meta = red_band.meta  # Metadata of the red band

# Replace negative values with 0
red_band_data = np.clip(red_band_data, 0, None)

# Check the actual pixel value range after clipping
min_value = np.min(red_band_data)
max_value = np.max(red_band_data)

# Print out the new range of values
print(f"Minimum pixel value after clipping: {min_value}")
print(f"Maximum pixel value after clipping: {max_value}")

# Set the minimum and maximum values for display (adjust brightness based on actual pixel range)
vmin, vmax = min_value, min_value + 0.02  # Small range based on min value

# Create the plot
fig, ax = plt.subplots(figsize=(10, 8))
plt.title("Red Band - 08-06-2024 Tomato Farm (Brightness Adjusted, Negative Values Clipped)")
img = ax.imshow(red_band_data, cmap='Reds', vmin=vmin, vmax=vmax)

# Turn off axis numbers
ax.set_xticks([])
ax.set_yticks([])

# Make the color bar shorter using make_axes_locatable
divider = make_axes_locatable(ax)
cax = divider.append_axes("right", size="5%", pad=0.05)  # Adjust size and pad for the colorbar
cbar = fig.colorbar(img, cax=cax)
cbar.set_label("Reflectance")

plt.show()

Minimum pixel value after clipping: 0.0
Maximum pixel value after clipping: 0.05971386656165123

# File path to the NIR band raster
nir_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_nir.tif"

# Open the NIR band using rasterio
with rasterio.open(nir_band_path) as nir_band:
    nir_band_data = nir_band.read(1)  # Read the first (and only) band
    nir_band_meta = nir_band.meta  # Metadata of the NIR band

# Replace negative values with 0
nir_band_data = np.clip(nir_band_data, 0, None)

# Check the actual pixel value range after clipping
min_value = np.min(nir_band_data)
max_value = np.max(nir_band_data)

# Print out the new range of values
print(f"Minimum pixel value after clipping: {min_value}")
print(f"Maximum pixel value after clipping: {max_value}")

# Set the minimum and maximum values for display (adjust brightness based on actual pixel range)
vmin, vmax = min_value, min_value + 0.08  # Small range based on min value

# Create the plot
fig, ax = plt.subplots(figsize=(10, 8))
plt.title("NIR Band - 08-06-2024 Tomato Farm (Brightness Adjusted, Negative Values Clipped)")
img = ax.imshow(nir_band_data, cmap='Purples', vmin=vmin, vmax=vmax)  # Using 'Purples' for NIR band

# Turn off axis numbers
ax.set_xticks([])
ax.set_yticks([])

# Make the color bar shorter using make_axes_locatable
divider = make_axes_locatable(ax)
cax = divider.append_axes("right", size="5%", pad=0.05)  # Adjust size and pad for the colorbar
cbar = fig.colorbar(img, cax=cax)
cbar.set_label("Reflectance")

plt.show()

Minimum pixel value after clipping: 0.0
Maximum pixel value after clipping: 0.12740455567836761

# File paths to the Red and NIR band rasters
red_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_red.tif"
nir_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_nir.tif"

# Open and read the Red band
with rasterio.open(red_band_path) as red_band:
    red_band_data = red_band.read(1)
    red_band_data = np.clip(red_band_data, 0, None)  # Replace negative values with 0

# Open and read the NIR band
with rasterio.open(nir_band_path) as nir_band:
    nir_band_data = nir_band.read(1)
    nir_band_data = np.clip(nir_band_data, 0, None)  # Replace negative values with 0

# Calculate NDVI
ndvi = (nir_band_data - red_band_data) / (nir_band_data + red_band_data + 1e-10)  # Small epsilon added to avoid division by zero

# Set the range for NDVI values to -1 to 1
ndvi = np.clip(ndvi, -1, 1)

# Display NDVI using matplotlib
fig, ax = plt.subplots(figsize=(10, 8))
plt.title("NDVI - 08-06-2024 Tomato Farm")
img = ax.imshow(ndvi, cmap='RdYlGn', vmin=0, vmax=1)  # Using RdYlGn color map for NDVI

# Turn off axis numbers
ax.set_xticks([])
ax.set_yticks([])

# Make the color bar shorter using make_axes_locatable
divider = make_axes_locatable(ax)
cax = divider.append_axes("right", size="5%", pad=0.05)  # Adjust size and pad for the colorbar
cbar = fig.colorbar(img, cax=cax)
cbar.set_label("NDVI Value")

plt.show()

# File path to the shapefile
shapefile_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\SHP\DrKisekka_Tomato\Procedures\Shapefile\polygons_shapefile\polygons_shapefile.shp"

# Read the shapefile using geopandas
shapefile = gpd.read_file(shapefile_path)

# Print the metadata of the shapefile
print("Shapefile Metadata:")
print(f"Coordinate Reference System (CRS): {shapefile.crs}")
print(f"Number of features (geometries): {len(shapefile)}")
print(f"Columns (Attributes): {list(shapefile.columns)}")

# Display the first few rows of the shapefile's attribute table
print("\nShapefile Attribute Table (First 5 rows):")
print(shapefile.head())

Shapefile Metadata:
Coordinate Reference System (CRS): EPSG:32610
Number of features (geometries): 126
Columns (Attributes): ['T_ID', 'T_row', 'T_col', 'geometry']

Shapefile Attribute Table (First 5 rows):
   T_ID  T_row  T_col                                           geometry
0     1      1      1  POLYGON ((606242.702 4265896.773, 606244.167 4...
1     2      1      2  POLYGON ((606242.599 4265874.444, 606244.064 4...
2     3      2      1  POLYGON ((606244.166 4265896.751, 606245.631 4...
3     4      2      2  POLYGON ((606244.064 4265874.422, 606245.528 4...
4     5      3      1  POLYGON ((606245.631 4265896.730, 606247.096 4...

# File path to the original shapefile
shapefile_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\SHP\DrKisekka_Tomato\Procedures\Shapefile\polygons_shapefile\polygons_shapefile.shp"

# Read the shapefile using geopandas
shapefile = gpd.read_file(shapefile_path)

# Apply a small buffer to close any tiny gaps between polygons
shapefile['geometry'] = shapefile['geometry'].buffer(0.01)

# Group the polygons by 'T_row' and merge the geometries for each group
def merge_and_simplify(group):
    merged = unary_union(group)
    if merged.geom_type == 'MultiPolygon':
        # Simplify MultiPolygon by taking the convex hull or bounding box to merge them properly
        merged = Polygon(merged.convex_hull)
    return merged

merged_polygons = shapefile.groupby('T_row').agg({
    'geometry': lambda g: merge_and_simplify(g)  # Merge and simplify geometries for each T_row
}).reset_index()

# Merge the new geometry back into the original data, and make sure it's a GeoDataFrame
merged_shapefile = shapefile.drop(columns='geometry').drop_duplicates(subset='T_row').merge(merged_polygons, on='T_row')

# Convert the merged result back to a GeoDataFrame
merged_shapefile = gpd.GeoDataFrame(merged_shapefile, geometry='geometry', crs=shapefile.crs)

# Output path for the updated shapefile
output_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\SHP\DrKisekka_Tomato\Procedures\Shapefile\polygons_shapefile_Updated\polygons_shapefile_Updated.shp"

# Save the updated shapefile to the specified directory
merged_shapefile.to_file(output_path)

# Print the metadata of the shapefile
print("Shapefile Metadata:")
print(f"Coordinate Reference System (CRS): {merged_shapefile.crs}")
print(f"Number of features (geometries): {len(merged_shapefile)}")
print(f"Columns (Attributes): {list(merged_shapefile.columns)}")

# Display the first few rows of the shapefile's attribute table
print("\nShapefile Attribute Table (First 5 rows):")
print(merged_shapefile.head())

Shapefile Metadata:
Coordinate Reference System (CRS): EPSG:32610
Number of features (geometries): 63
Columns (Attributes): ['T_ID', 'T_row', 'T_col', 'geometry']

Shapefile Attribute Table (First 5 rows):
   T_ID  T_row  T_col                                           geometry
0     1      1      1  POLYGON ((606242.589 4265874.444, 606242.692 4...
1     3      2      1  POLYGON ((606245.538 4265874.416, 606245.435 4...
2     5      3      1  POLYGON ((606245.518 4265874.401, 606245.621 4...
3     7      4      1  POLYGON ((606248.468 4265874.373, 606248.365 4...
4     9      5      1  POLYGON ((606249.933 4265874.351, 606249.830 4...

# File paths to the Red and NIR band rasters
red_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_red.tif"
nir_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_nir.tif"

# File path to the updated shapefile
shapefile_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\SHP\DrKisekka_Tomato\Procedures\Shapefile\polygons_shapefile_Updated\polygons_shapefile_Updated.shp"

# Open and read the Red band
with rasterio.open(red_band_path) as red_band:
    red_band_data = red_band.read(1)
    red_band_data = np.clip(red_band_data, 0, None)  # Replace negative values with 0
    ndvi_crs = red_band.crs  # Get the CRS of the NDVI data
    ndvi_bounds = red_band.bounds  # Get the extent (bounds) of the raster

# Open and read the NIR band
with rasterio.open(nir_band_path) as nir_band:
    nir_band_data = nir_band.read(1)
    nir_band_data = np.clip(nir_band_data, 0, None)  # Replace negative values with 0

# Calculate NDVI
ndvi = (nir_band_data - red_band_data) / (nir_band_data + red_band_data + 1e-10)  # Small epsilon added to avoid division by zero

# Set the range for NDVI values to -1 to 1
ndvi = np.clip(ndvi, -1, 1)

# Read the updated shapefile with geopandas
shapefile = gpd.read_file(shapefile_path)

# Reproject the shapefile to match the NDVI CRS if necessary
if shapefile.crs != ndvi_crs:
    shapefile = shapefile.to_crs(ndvi_crs)

# Create the plot using GeoPandas and Matplotlib
fig, ax = plt.subplots(figsize=(10, 8))

# Show the NDVI using the rasterio 'show' function which ensures proper spatial alignment
im = show(ndvi, transform=red_band.transform, cmap='RdYlGn', vmin=0, vmax=1, ax=ax)

# Overlay the shapefile boundaries with red edges
shapefile.boundary.plot(ax=ax, edgecolor='red', linewidth=1)

# Add a color bar for NDVI
divider = make_axes_locatable(ax)
cax = divider.append_axes("right", size="5%", pad=0.05)
plt.colorbar(im.get_images()[0], cax=cax, label="NDVI Value")  # Use the color bar for NDVI values

# Add labels and center the title, using 'y' to adjust the title's vertical position
plt.suptitle("NDVI with Shapefile Boundaries - 08-06-2024 Tomato Farm", x=0.5, y=0.85, ha='center', fontsize=16)

# Turn off axis labels and ticks
ax.set_xticks([])
ax.set_yticks([])
ax.set_xlabel('')
ax.set_ylabel('')

# Show the plot
plt.show()

# File paths to the NDVI and shapefile
red_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_red.tif"
nir_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_nir.tif"
shapefile_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\SHP\DrKisekka_Tomato\Procedures\Shapefile\polygons_shapefile_Updated\polygons_shapefile_Updated.shp"

# Open and read the Red and NIR bands
with rasterio.open(red_band_path) as red_band:
    red_band_data = red_band.read(1)
    red_band_data = np.clip(red_band_data, 0, None)  # Replace negative values with 0
    ndvi_crs = red_band.crs  # Get the CRS of the NDVI data
    ndvi_transform = red_band.transform  # Get the transform of the NDVI

with rasterio.open(nir_band_path) as nir_band:
    nir_band_data = nir_band.read(1)
    nir_band_data = np.clip(nir_band_data, 0, None)  # Replace negative values with 0

# Calculate NDVI
ndvi = (nir_band_data - red_band_data) / (nir_band_data + red_band_data + 1e-10)
ndvi = np.clip(ndvi, -1, 1)  # Clip NDVI values to the range -1 to 1

# Read the shapefile with the T_rows
shapefile = gpd.read_file(shapefile_path)

# Reproject the shapefile to match the NDVI CRS if necessary
if shapefile.crs != ndvi_crs:
    shapefile = shapefile.to_crs(ndvi_crs)

# Create an empty list to hold the NDVI statistics
ndvi_stats = []

# Loop through each T_row in the shapefile
for _, row in shapefile.iterrows():
    # Get the geometry (polygon) for the current T_row
    geometry = row['geometry']
    
    # Create a mask of the NDVI data where the polygon is located
    mask = rasterio.features.geometry_mask([geometry], transform=ndvi_transform, invert=True, out_shape=ndvi.shape)
    
    # Apply the mask to the NDVI data to extract NDVI values for this polygon
    ndvi_values_in_polygon = ndvi[mask]
    
    # Calculate statistics for the current T_row
    min_ndvi = np.min(ndvi_values_in_polygon)
    max_ndvi = np.max(ndvi_values_in_polygon)
    avg_ndvi = np.mean(ndvi_values_in_polygon)
    median_ndvi = np.median(ndvi_values_in_polygon)
    
    # Append the statistics to the list
    ndvi_stats.append({
        'T_row': row['T_row'],
        'Min NDVI': min_ndvi,
        'Max NDVI': max_ndvi,
        'Avg NDVI': avg_ndvi,
        'Median NDVI': median_ndvi
    })

# Convert the list to a pandas DataFrame
ndvi_stats_df = pd.DataFrame(ndvi_stats)

# File path to save the CSV
csv_file_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\CSV\ndvi_statistics.csv"

# Save the DataFrame to a CSV file
ndvi_stats_df.to_csv(csv_file_path, index=False)

# Change pandas display options to show the entire DataFrame
pd.set_option('display.max_rows', None)  # Set the max rows to None to display all rows
pd.set_option('display.max_columns', None)  # Set the max columns to None to display all columns

# Display the DataFrame properly in Jupyter Notebook
from IPython.display import display
display(ndvi_stats_df)

# Set the style of seaborn to 'whitegrid' for better visibility of grid lines
sns.set(style="whitegrid")

# File paths
red_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_red.tif"
nir_band_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\Data\08-06-2024_DrKisekka-Tomato_Farm_transparent_reflectance_nir.tif"
shapefile_path = r"C:\Users\15302\Downloads\DrKisekka_Tomato\SHP\DrKisekka_Tomato\Procedures\Shapefile\polygons_shapefile_Updated\polygons_shapefile_Updated.shp"

# Open and read the Red and NIR bands
with rasterio.open(red_band_path) as red_band:
    red_band_data = red_band.read(1)
    red_band_data = np.clip(red_band_data, 0, None)  # Remove negative values
    ndvi_crs = red_band.crs
    ndvi_transform = red_band.transform

with rasterio.open(nir_band_path) as nir_band:
    nir_band_data = nir_band.read(1)
    nir_band_data = np.clip(nir_band_data, 0, None)

# Calculate NDVI
ndvi = (nir_band_data - red_band_data) / (nir_band_data + red_band_data + 1e-10)
ndvi = np.clip(ndvi, -1, 1)

# Read and reproject the shapefile
shapefile = gpd.read_file(shapefile_path)
if shapefile.crs != ndvi_crs:
    shapefile = shapefile.to_crs(ndvi_crs)

# Extract NDVI values for each T_row
ndvi_distributions = {row: [] for row in range(1, 64)}
for _, row in shapefile.iterrows():
    geometry = row['geometry']
    mask = rasterio.features.geometry_mask([geometry], transform=ndvi_transform, invert=True, out_shape=ndvi.shape)
    ndvi_values_in_polygon = ndvi[mask]
    ndvi_distributions[row['T_row']].extend(ndvi_values_in_polygon)

# Convert to DataFrame for plotting
ndvi_df = pd.DataFrame({k: pd.Series(v) for k, v in ndvi_distributions.items()})
ndvi_df = ndvi_df.map(lambda x: x if x >= 0.6 else np.nan)

# Calculate medians
medians = ndvi_df.median()

# Categorize medians into 10 groups based on deciles
deciles = pd.qcut(medians, 10, labels=range(10))

# Assign colors based on decile group
color_palette = sns.color_palette("Greens", 10)
palette = {k: color_palette[int(deciles[k])] for k in medians.index}

# Create the box plot with custom palette
plt.figure(figsize=(15, 10))
sns.boxplot(data=ndvi_df, palette=palette, showfliers=False)  # 'showfliers=False' removes outliers
plt.title('NDVI Distribution for Each Tomato Row', fontsize=16)
plt.xlabel('Tomato Row', fontsize=14)
plt.ylabel('NDVI Value', fontsize=14)
plt.grid(True)
plt.xticks(rotation=90)  # Rotate x-axis labels for better readability
plt.show()

	T_row	Min NDVI	Max NDVI	Avg NDVI	Median NDVI
0	1	0.292895	0.905243	0.776103	0.819461
1	2	0.299648	0.898416	0.769655	0.811888
2	3	0.302086	0.907944	0.795964	0.833704
3	4	0.284377	0.900679	0.777486	0.821106
4	5	0.260260	0.915845	0.810768	0.845294
5	6	0.286055	0.911459	0.805762	0.846388
6	7	0.290043	0.920338	0.832236	0.863085
7	8	0.242104	0.918445	0.833681	0.867689
8	9	0.291374	0.922246	0.814388	0.857017
9	10	0.287791	0.918158	0.824628	0.858600
10	11	0.309191	0.928328	0.837097	0.863484
11	12	0.308985	0.922555	0.845657	0.868137
12	13	0.309867	0.922918	0.830907	0.865506
13	14	0.272548	0.919118	0.814245	0.860983
14	15	0.265358	0.920172	0.820680	0.859751
15	16	0.279018	0.920291	0.827180	0.866997
16	17	0.278705	0.923196	0.832440	0.867985
17	18	0.275244	0.920136	0.822076	0.863268
18	19	0.254523	0.925282	0.828712	0.862849
19	20	0.271349	0.926527	0.844255	0.875046
20	21	0.302372	0.926597	0.848634	0.874040
21	22	0.310630	0.926672	0.852433	0.872174
22	23	0.319968	0.927522	0.845638	0.867290
23	24	0.313875	0.924295	0.841506	0.865781
24	25	0.313341	0.927563	0.842997	0.867129
25	26	0.301069	0.925287	0.826853	0.857648
26	27	0.300625	0.921605	0.827905	0.856087
27	28	0.285682	0.920410	0.822871	0.852397
28	29	0.308498	0.928617	0.841434	0.868011
29	30	0.327414	0.927906	0.855061	0.868614
30	31	0.310697	0.929288	0.849257	0.869876
31	32	0.200529	0.929435	0.836590	0.865220
32	33	0.209777	0.929319	0.844068	0.875766
33	34	0.271624	0.927777	0.825709	0.874122
34	35	0.268834	0.924679	0.828465	0.870050
35	36	0.290278	0.924141	0.825285	0.868310
36	37	0.271050	0.925117	0.829413	0.870069
37	38	0.270766	0.928770	0.831307	0.875863
38	39	0.281253	0.931053	0.831510	0.872929
39	40	0.269756	0.925184	0.812203	0.868180
40	41	0.270368	0.930743	0.828853	0.879194
41	42	0.277699	0.931100	0.832026	0.878157
42	43	0.300043	0.931084	0.832301	0.876684
43	44	0.296767	0.927144	0.826428	0.869377
44	45	0.281539	0.925508	0.827935	0.862562
45	46	0.300527	0.927247	0.833627	0.870381
46	47	0.288258	0.918993	0.837981	0.870070
47	48	0.282135	0.918970	0.817023	0.863529
48	49	0.301140	0.924689	0.828211	0.873284
49	50	0.298126	0.922374	0.833571	0.874002
50	51	0.295354	0.922186	0.830210	0.867022
51	52	0.292280	0.917150	0.826106	0.862848
52	53	0.292428	0.917272	0.813567	0.851902
53	54	0.294261	0.918330	0.811446	0.852179
54	55	0.296700	0.916619	0.817921	0.856840
55	56	0.295247	0.916857	0.820908	0.860064
56	57	0.291777	0.920354	0.824784	0.861363
57	58	0.289915	0.915864	0.795514	0.853667
58	59	0.143817	0.912401	0.759962	0.827210
59	60	0.273048	0.913652	0.787233	0.834516
60	61	0.271906	0.906201	0.791029	0.831501
61	62	0.284361	0.913395	0.813106	0.854460
62	63	0.284828	0.904838	0.738986	0.831861

NDVI Calculation and Shapefile Processing from Drone Imagery¶

Import Required Libraries¶

Read and Display the Red Band¶

Read and Display the NIR Band¶

NDVI Calculation and Display¶

Read and Display Shapefile Metadata¶

Merge Polygons by T_row and Save the Updated Shapefile¶

NDVI Visualization with Shapefile Boundaries¶

Key Steps:¶

Calculate NDVI Statistics for Each Tomato Row¶

Visualize NDVI Distribution for Each Tomato Row¶

Contact Information¶