It is suggested that users first execute the notebook "as is" to complete the Google authorizations and view sample results. Then, users should look for the "MODIFY HERE" labels at the top of several code blocks to identify code that can be modified. For example, users can select a new analysis region, time extent, speckle filter size, the date used for the histogram plot, the date used for the single-band threshold water plot, and the dates used for the multi-date threshold flooding plot. Once the full notebook has been run, individual code blocks can be re-run with "Shift-Return", or segments of the code can be run from the Runtime menu. Users do not have to go through the Google authorization steps for additional execution cycles.
# Ignore warnings
import warnings
warnings.simplefilter('ignore')
# Load Data Cube Configuration
import datacube
dc = datacube.Datacube()
# Import Utilities
from datacube.utils import masking
from dea_tools.plotting import rgb, display_map
import numpy as np
import xarray as xr
import pandas as pd
import matplotlib.pyplot as plt
### EASI tools
import sys, os
sys.path.append(os.path.expanduser('/home/jovyan/hub-notebooks/scripts'))
os.environ['USE_PYGEOS'] = '0'
from easi_tools import EasiNotebooks
import notebook_utils
easi = EasiNotebooks()
# Select a Product and Platform
product = "s1_rtc"
Select the center of an analysis region (lat_long) below. The size of the region (in degrees) surrounding this center point is defined by the "box_size_deg" parameter. Users can select one of the sample regions or add a new region. Use the map below to zoom in or out to find other regions, and click on the map to view a Lat-Lon position. After selecting an analysis region, you can also select a time window by defining the start and end dates for the "time_extents" parameter.
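The conversion from a center point and box size to latitude/longitude bounds is a simple half-width offset on each side. A minimal sketch, using the Lake Berryessa sample values from the commented examples below:

```python
# Derive a bounding box from a center point and a box size in degrees
lat_long = (38.5, -122.228)   # (latitude, longitude) of the center point
box_size_deg = 0.10           # width/height of the analysis box in degrees

# Each bound is half the box size away from the center
latitude = (lat_long[0] - box_size_deg / 2, lat_long[0] + box_size_deg / 2)
longitude = (lat_long[1] - box_size_deg / 2, lat_long[1] + box_size_deg / 2)

print(round(latitude[0], 3), round(latitude[1], 3))    # 38.45 38.55
print(round(longitude[0], 3), round(longitude[1], 3))  # -122.278 -122.178
```

The resulting `latitude` and `longitude` tuples are in the form expected by `display_map` and `dc.load`.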
# MODIFY HERE
# Select the center of an analysis region (lat_long)
# Adjust the surrounding box size (box_size) around the center (in degrees)
# Camp Fire, Paradise, CA
# Time = 2018-10-01, 2018-11-30
# Fire started 11-08, contained 11-25
# Data Filter > Orbit=137
# lat_long = (39.76, -121.550)
# box_size_deg = 0.25
# time_extents = ('2018-10-01', '2018-12-31')
# Lake Berryessa, Napa, CA
# Time = 2020-07-01, 2020-09-01
# Fire started 08-16-20
# Data Filter > Orbit=35
# lat_long = (38.5, -122.228)
# box_size_deg = 0.10
# time_extents = ('2020-07-01', '2020-09-01')
# Sample Fire Region from Jack
# Time = 2020-02-04
# Data Filter > Orbit=147
# lat_long = (-35.625, 148.920)
# box_size_deg = 0.40
time_extents = ('2019-01-01', '2019-03-01')
# Calculate the latitude and longitude bounds of the analysis box
# latitude = (lat_long[0]-box_size_deg/2, lat_long[0]+box_size_deg/2)
# longitude = (lat_long[1]-box_size_deg/2, lat_long[1]+box_size_deg/2)
latitude = easi.latitude
longitude = easi.longitude
display_map(longitude,latitude)
This is where the Sentinel-1 data is loaded with specific filtering parameters. Although this product is Radiometric Terrain Corrected (RTC), viewing geometry still differs between orbits, so users are recommended to compare only scenes from the same pass direction (ASCENDING or DESCENDING) and orbit path. Using one consistent pass direction ensures the viewing angles are consistent for a given location and avoids false land change detection. By experimenting with the choice of pass direction, it may be possible to maximize the number of dates available for analysis.
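One way to restrict an analysis to a single pass direction is to filter the dataset list by its metadata before loading. The sketch below uses stand-in dictionaries; the property key `sat:orbit_state` is an assumption and should be checked against the actual metadata of the product (e.g. via `ds.metadata_doc`):

```python
# Sketch (with stand-in metadata documents) of filtering to one pass direction.
# The key 'sat:orbit_state' is an assumption -- inspect ds.metadata_doc for the
# real property name used by the product's metadata schema.
def filter_by_orbit_state(datasets, orbit_state):
    """Keep only datasets whose metadata reports the requested pass direction."""
    return [ds for ds in datasets
            if ds['properties'].get('sat:orbit_state') == orbit_state]

# Stand-in metadata documents (real ones come from dc.find_datasets(...))
fake_datasets = [
    {'properties': {'sat:orbit_state': 'ascending'}},
    {'properties': {'sat:orbit_state': 'descending'}},
    {'properties': {'sat:orbit_state': 'ascending'}},
]

ascending = filter_by_orbit_state(fake_datasets, 'ascending')
print(len(ascending))  # 2
```

With real data the filtered list could then be grouped and loaded, keeping all acquisitions in one consistent viewing geometry.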
parameters = dict(product=product, measurements=['vv','vh'],
                  time=time_extents, lat=latitude, lon=longitude,
                  group_by='time')
# query={'filter':'relativeOrbitNumber_start=147'})
sar_dataset = dc.load(**parameters)
sar_dataset
from operator import itemgetter
def get_metadata(group):
    metadata = (set(), set(), set(), set())
    for ds in group:
        metadata[0].add(np.datetime64(ds.metadata_doc.get('properties').get('dtr:start_datetime'), 'D'))
        metadata[1].add(ds.metadata_doc.get('properties').get('sentinel:orbit'))
        metadata[2].add(ds.metadata_doc.get('properties').get('eo:platform'))
        metadata[3].add(ds.metadata_doc.get('properties').get('sentinel:datatake_id'))
    return tuple(map(lambda x: ', '.join(str(i) for i in x), metadata))
parameters['group_by'] = parameters.get('group_by') or 'time'
sar_metadata = sorted([get_metadata(groups)
                       for groups in dc.group_datasets(dc.find_datasets(**parameters),
                                                       parameters.get('group_by')).values],
                      key=itemgetter(0))
# Show acquisition indices and dates
pd.set_option('display.max_rows', 250)
pd.DataFrame(sar_metadata, columns=['Acquisition Date', 'Orbit', 'Platform', 'ID'])
Radar data is often "grainy" in appearance, and differences between water and land are not consistent. To improve the data, it is common to apply speckle filtering. Below is an algorithm that uses a common "block" filter to average the pixels surrounding any given pixel. Users can select an odd-numbered "filter_size" (e.g., 3, 5, 7) to filter both the VV and VH data.
# Setup dB to power conversion functions so that filters work on power values
def to_pwr(x):
    return 10**(x/10)
def to_db(x):
    return 10*np.log10(x)
# MODIFY HERE
# Users can select the "filter_size" to define the level of speckle filtering. The baseline is 5.
# The filter size must be an odd number, such as 3, 5, 7, etc.
filter_size = 5
from ceos_utils.data_cube_utilities.raster_filter import stats_filter_2d
# Set any null values to 0 before applying the filter to prevent issues
sar_dataset_filled = sar_dataset.where(~sar_dataset.isnull(), 0)
# Create new entries in the dataset for the filtered VV and VH data
sar_dataset["block_filter_vv"] = sar_dataset_filled.vv.pipe(to_pwr).groupby("time")\
    .apply(stats_filter_2d, statistic='mean', filter_size=filter_size)\
    .pipe(to_db)
sar_dataset["block_filter_vh"] = sar_dataset_filled.vh.pipe(to_pwr).groupby("time")\
    .apply(stats_filter_2d, statistic='mean', filter_size=filter_size)\
    .pipe(to_db)
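For reference, the mean "block" filter applied by `stats_filter_2d` can be sketched in plain NumPy. This is an illustrative stand-in, not the actual `ceos_utils` implementation; the key point is that the averaging happens in power space, with a dB conversion on either side:

```python
import numpy as np

def to_pwr(x):
    return 10 ** (x / 10)

def to_db(x):
    return 10 * np.log10(x)

def mean_block_filter(arr, filter_size=5):
    """Average each pixel with its (filter_size x filter_size) neighborhood.
    Edges are handled by padding with the edge values."""
    pad = filter_size // 2
    padded = np.pad(arr, pad, mode='edge')
    out = np.empty_like(arr, dtype=float)
    for i in range(arr.shape[0]):
        for j in range(arr.shape[1]):
            out[i, j] = padded[i:i + filter_size, j:j + filter_size].mean()
    return out

# Filter in power space, then convert back to dB (as in the notebook)
vh_db = np.array([[-15.0, -15.0, -27.0],
                  [-15.0, -27.0, -27.0],
                  [-15.0, -15.0, -15.0]])
filtered_db = to_db(mean_block_filter(to_pwr(vh_db), filter_size=3))
print(filtered_db.shape)  # (3, 3)
```

A larger `filter_size` smooths speckle more aggressively at the cost of spatial detail.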
Histogram plots are good for viewing the statistics of the VV and VH data. In most cases it is easy to distinguish land pixels (higher values) from water pixels (lower values). The VH histogram below will typically show land peaking near -15 dB and water peaking near -27 dB. A reasonable threshold for water detection can be estimated from this histogram; for example, one might select -20 dB to separate water from land.
# MODIFY HERE
# Choose a single time slice by its index (listed above)
acq_ind_to_show = 2
fig = plt.figure(figsize=(15, 5))
sar_dataset.isel(time=acq_ind_to_show).block_filter_vv.plot.hist(bins=1000, range=(-35, 0),
                                                                 label="VV Block Filter")
sar_dataset.isel(time=acq_ind_to_show).block_filter_vh.plot.hist(bins=1000, range=(-35, 0),
                                                                 label="VH Block Filter", alpha=0.5)
plt.legend()
plt.xlabel("Backscatter Intensity (dB)")
plt.ylabel("Number of Pixels")
plt.title("Histogram Comparison of Block-Filtered VV and VH Backscatter")
plt.show()
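Once a threshold has been chosen from the histogram (e.g. -20 dB for VH), turning it into a water mask is a single comparison. A minimal sketch with synthetic values (the array below is illustrative, not real data):

```python
import numpy as np

water_threshold_db = -20.0  # chosen from the VH histogram

# Synthetic VH backscatter values (dB): land pixels near -15, water pixels near -27
vh_db = np.array([[-15.2, -14.8, -26.5],
                  [-16.0, -27.3, -26.9],
                  [-15.5, -15.1, -27.0]])

water_mask = vh_db < water_threshold_db  # True where water is likely
water_fraction = water_mask.mean()       # fraction of pixels classified as water
print(int(water_mask.sum()))  # 4
```

The same comparison applied to `sar_dataset.block_filter_vh` would yield a per-pixel water mask for any time slice.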
Backscatter amplitude for each band can be scaled to an 8-bit range of 0-255 to improve visual output and maximize contrast in VV and VH image products. The process works as follows. Gamma-nought backscatter amplitude (in dB units) is converted to raw (digital number) units using the conversion: DN (amplitude) = 10^(dB/20). Histograms are then used to view the range of dB values for the VV and VH bands. The range of expected values (across diverse land types) is then scaled to an 8-bit range using the formula: scale = 256 / (range of DN values). Finally, an "offset" value is subtracted so that the full range of values is distributed across the 8-bit range. The final equation is: DN (amplitude, 8-bit) = ( DN(amplitude) - offset ) * scale.
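The scale and offset constants follow directly from those formulas. For VV, offset = 10^(-16/20) ≈ 0.158 and scale = 256 / (1.0 - 0.158) ≈ 304; the notebook uses the slightly rounded values 303 and 493. A quick check of the arithmetic:

```python
# Derive the 8-bit scaling constants from the stated dB ranges:
# VV spans 0 dB to -16 dB, VH spans -5 dB to -27 dB
def amp(db):
    """Convert gamma-nought dB to digital-number amplitude."""
    return 10 ** (db / 20)

vv_offset = amp(-16)                   # ~0.158
vv_scale = 256 / (amp(0) - amp(-16))   # ~304
vh_offset = amp(-27)                   # ~0.045
vh_scale = 256 / (amp(-5) - amp(-27))  # ~495

print(round(vv_offset, 3), round(vv_scale))  # 0.158 304
print(round(vh_offset, 3), round(vh_scale))  # 0.045 495
```

Small differences in these constants only shift the display stretch slightly and do not affect the analysis.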
# This backscatter scaling is optimized for block-filtered data
# VV band range is 0dB to -16dB which is DN=1.00 to DN=0.158
# VH band range is -5dB to -27dB which is DN=0.562 to DN=0.045
# VV/VH range is 0.0 to 1.0. This data is scaled by 20 for improved color contrast
vv_convert = (10**(sar_dataset.block_filter_vv/20)-0.158)*303
vh_convert = (10**(sar_dataset.block_filter_vh/20)-0.045)*493
sar_dataset['vv_amp'] = vv_convert
sar_dataset['vh_amp'] = vh_convert
sar_dataset['vvvh_amp'] = (vv_convert / vh_convert) * 20
sar_dataset['vvvh'] = (sar_dataset.vv / sar_dataset.vh) * 20
# Plots of VV and VH Backscatter Intensity
fig, ax = plt.subplots(1, 2, figsize=(16, 8))
sar_dataset['r1'] = sar_dataset.vv
sar_dataset['b1'] = sar_dataset.vv
sar_dataset['g1'] = sar_dataset.vv
rgb(sar_dataset.isel(time=acq_ind_to_show), ax=ax[0], bands=['r1','g1','b1'])
sar_dataset['r2'] = sar_dataset.vh
sar_dataset['b2'] = sar_dataset.vh
sar_dataset['g2'] = sar_dataset.vh
rgb(sar_dataset.isel(time=acq_ind_to_show), ax=ax[1], bands=['r2','g2','b2'])
ax[0].set_title('VV Backscatter'), ax[0].xaxis.set_visible(False), ax[0].yaxis.set_visible(False)
ax[1].set_title('VH Backscatter'), ax[1].xaxis.set_visible(False), ax[1].yaxis.set_visible(False)
plt.show()
# RGB Plot of Backscatter Intensity (RGB= VV, VH, VV/VH)
# High backscatter (both bands) due to vegetation and foliage will appear as YELLOW (mix of red and green)
# New vegetation and urban areas are MAGENTA in color (due to high overall scattering and higher VV compared to VH)
# Low vegetation areas are BLUE (due to low overall scattering and higher VV compared to VH)
# Water is BLACK (low backscatter in both bands with similar VV and VH)
rgb(sar_dataset.isel(time=acq_ind_to_show),bands=['vv_amp','vh_amp','vvvh_amp'], size=10, robust=True)
plt.title('Backscatter RGB: VV, VH, VV/VH')
plt.axis('off')
plt.show()
# Define a custom RGB - This custom RGB allows specific bands and time slices to be assigned to each color
# This custom RGB can be valuable for viewing land changes between two time periods
def custom_rgb(dataset, rgb_to_data_arr_ind_map, **rgb_kwargs):
    rgb_data = {}
    # The channel names below match the default band names expected by rgb()
    for channel, [data_var, time_ind] in zip(['nbart_red', 'nbart_green', 'nbart_blue'], rgb_to_data_arr_ind_map):
        rgb_data[channel] = dataset[data_var].isel(time=time_ind)
        rgb_data[channel] = rgb_data[channel].drop('time').to_array()
    rgb_data = xr.Dataset(rgb_data).squeeze('variable')
    rgb_kwargs['ds'] = rgb_data
    rgb(**rgb_kwargs)
# MODIFY HERE
# Define a custom RGB image using multiple dates and bands
# This product can be useful to view land change between different time periods
# Select the band (as a single-element list, required by custom_rgb): ['vv_amp'] or ['vh_amp']
band = ['vh_amp']
# Select the scene index for each color: Red, Green, Blue
first_scene = 0 # This is the RED color
second_scene = 2 # This is the GREEN color
third_scene = 3 # This is the BLUE color
# Color Interpretation for output results
# Red areas have high vegetation (cropping) at the early date
# Green areas have high vegetation (cropping) at the middle date
# Blue areas have high vegetation (cropping) at the later date
# Cyan (mix of green and blue) have higher vegetation in 2nd and 3rd dates compared to 1st date
# Magenta (mix of red and blue) have higher vegetation in 1st and 3rd dates compared to 2nd date
# Yellow (mix of red and green) have higher vegetation in 1st and 2nd dates compared to 3rd date
# Grey regions are high scattering (all dates) due to tree foliage or grass vegetation
# Black regions are low scattering (all dates) due to water or low vegetation (bare soils)
rgb_to_data_arr_ind_map = [[band,first_scene],[band,second_scene],[band,third_scene]]
custom_rgb(sar_dataset, rgb_to_data_arr_ind_map, size=10)
plt.title('Multi-Date RGB Backscatter Product')
plt.axis('off')
plt.show()
The code below selects two dates, a variable (VV or VH) and a threshold range. The final product performs a comparison of the two dates and calculates the change in backscatter between those dates. Pixels with significant reduction in backscatter (e.g., loss of 7 dB) are likely changes from land to water due to flooding. Pixels with significant increases in backscatter (e.g., increase of 7 dB) are likely changes from water to land due to drying or drought.
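The core of that change product is a subtraction followed by two threshold comparisons. A minimal sketch with synthetic values (the ±7 dB range mirrors the example in the text; the notebook cell below uses its own `threshold_range`):

```python
import numpy as np

# Synthetic "before" and "after" VH backscatter (dB) for a handful of pixels
first_acq = np.array([-15.0, -15.0, -27.0, -26.0])
second_acq = np.array([-15.5, -26.0, -27.5, -15.0])

threshold_range = (-7.0, 7.0)  # changes outside this range are "significant"

change = second_acq - first_acq
flooded = change < threshold_range[0]  # large backscatter drop: land -> water
dried = change > threshold_range[1]    # large backscatter rise: water -> land

print(flooded.tolist())  # [False, True, False, False]
print(dried.tolist())    # [False, False, False, True]
```

Pixels inside the threshold range are treated as unchanged; masking known water (as done below) prevents normal water variability from appearing as false change.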
# MODIFY HERE
# Select TWO acquisitions to calculate a change product
# Choose from the indices in the table above
# first_acq_ind = First time slice acquisition
# second_acq_ind = Second time slice acquisition
first_acq_ind = 1
second_acq_ind = 3
# Select the variable to plot: vv or vh
threshold_variable = 'block_filter_vh'
# The code will calculate the difference of the two images (Second-First)
# Define a threshold range to compare the difference of the two acquisitions
# GREY = Pixels NOT in the threshold range
# RED = Pixels LESS than the low end of the threshold range
# GREEN = Pixels MORE than the high end of the threshold range
threshold_range = (-4, 8)
# Set the overlay colors
# Calculate the difference in backscatter between the two times
# Find the pixels above or below the threshold range (these are significant changes)
color_loss = np.array([255,0,0]) # backscatter decrease (RED)
color_gain = np.array([0,255,0]) # backscatter increase (GREEN)
color_black = np.array([0,0,0]) # low backscatter change, water (BLACK)
first_acq = sar_dataset.isel(time=first_acq_ind)
second_acq = sar_dataset.isel(time=second_acq_ind)
change_product = second_acq[threshold_variable] - first_acq[threshold_variable]
below_th = change_product.values < threshold_range[0]
above_th = threshold_range[1] < change_product.values
# Set the water threshold value based on data in the histograms for the selected band
# This will "mask" the water pixels and not show false change
water = first_acq[threshold_variable].values < -21.0
# Create a custom threshold plot to identify land change
# The background image VV backscatter (grey-scale)
# RED areas have decreased backscatter or a loss of vegetation
# GREEN areas have increased backscatter or an increase in vegetation
# BLACK areas have no significant backscatter change or are water
first_acq['red'] = first_acq.block_filter_vh
first_acq['green'] = first_acq.block_filter_vh
first_acq['blue'] = first_acq.block_filter_vh
rgb(first_acq, bands=['red', 'green', 'blue'], size=10)
# paint_on_mask=[(below_th, color_loss),(above_th, color_gain),(water, color_black)])
plt.title('Multi-Date Single-Band Threshold Land Change Product')
plt.axis('off')
plt.show()