In this notebook you will learn more about the MODIS products in the Data Cube and how to use the snow cover data and indices such as the 10-day NDSI.
This notebook requires a number of external Python modules to run, which are imported at the top of the notebook, as is the convention.
import datacube
import matplotlib.pyplot as plt
import numpy as np
import geopandas
import rasterstats
import pandas as pd
import xarray as xr
As shown in other notebooks, we need to initialise a Data Cube in order to have access to the Kyrgyzstan Data Cube (KDC), and this can be done as follows:
dc = datacube.Datacube()
Now let's see which MODIS products are in the Data Cube using the command below (already shown in a previous training session).
dc.list_products()
As you can see there are many products in the Data Cube, so let's look at the details of one of the MODIS products. For example, with the line below you can see what kind of data is in the product modis_nbar.
dc.list_measurements().loc['modis_nbar']
The results tell you the data inside the product, the type of data, the nodata value, and the measurement names with their aliases, which means you can load the data using either the measurement name or any of its aliases.
dc.list_measurements().loc['MOD10A1']
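For example, if the table above lists an alias such as 'NDSI_Snow_Cover' for the snow_cover band (the alias name here is an assumption; use whichever alias the table actually reports), the two loads below would return the same data:
# Load using the measurement name (other query parameters omitted for brevity)
ds_name = dc.load(product='MOD10A1', measurements=['snow_cover'], time='2020-01-01')
# Load using an alias instead (assumed alias name; take one from the table above)
ds_alias = dc.load(product='MOD10A1', measurements=['NDSI_Snow_Cover'], time='2020-01-01')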
With the following command you can check the description of a product. In this case 34 is the index of the product MOD10A1 found above from dc.list_products().
dc.list_products().loc[34,'description']
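Note that the numeric index can change as products are added or removed, so a more robust lookup filters by product name. A minimal sketch (assuming dc.list_products() returns a pandas DataFrame with a 'name' column, as in recent datacube versions):
# Look up a product description by name rather than by numeric index
products = dc.list_products()
products.loc[products['name'] == 'MOD10A1', 'description']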
The MODIS data have been downloaded from NASA; for more details you can check the documentation online.
query = {'time': ['2020-01-01', '2020-01-01'],
         'measurements': ['snow_cover'],
         'output_crs': 'EPSG:4326',
         'resolution': [-0.0041666733029590754, 0.0041666733029590754],
         'dask_chunks': {'time': -1, 'latitude': 782, 'longitude': 1744}
         }
# Loading the data
ds = dc.load(product='MOD10A1', **query)
print(ds)
# Select the Dataset in time, in this case the first satellite passage
ds = ds.isel(time=0)
print(ds)
Once we have selected a Dataset, we can find how many cloudy pixels are in our image. Remember that the value for cloudy pixels, documented at https://nsidc.org/data/MOD10A1/versions/6, is 250.
(ds.snow_cover.values==250).sum()
You can find the percentage of cloudy pixels in our raster. The .size attribute gives the total number of pixels in the snow_cover raster.
(ds.snow_cover.values==250).sum()/ds.snow_cover.size
This means that 45% of our image is covered by clouds.
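If you want a nicer readout, the same computation can be printed as a formatted percentage:
# Same computation as above, expressed as a percentage
cloud_fraction = (ds.snow_cover.values == 250).sum() / ds.snow_cover.size
print(f"Cloudy pixels: {cloud_fraction * 100:.1f}%")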
Now let's compute how many snow pixels are in our raster.
# Set the NDSI limit to 0.4 (snow_cover values are NDSI * 100)
ndsi_lim = 40
# Find pixels that have 0.4 <= NDSI <= 1 (snow pixels)
condition_snow_mask = (ds.snow_cover >= ndsi_lim) & (ds.snow_cover <= 100)
# Assign the value of 150 to all these pixels
snow_mask = xr.where(condition_snow_mask, 150, ds.snow_cover)
# Percentage of snow pixels
(snow_mask.values==150).sum()/ds.snow_cover.size
We can load the shapefile of the raions using geopandas (see the training session about geopandas):
raion_gdf = geopandas.read_file("data/kgz_admbnda_adm2_moes_20181119.shp", encoding='utf-8')
The following commands are used to plot the raster data (ds.snow_cover) within the geopandas dataframe raion_gdf.
fig, ax = plt.subplots(figsize=(25,10))
ds.snow_cover.plot(ax=ax, cmap='Blues_r')
raion_gdf.plot(ax=ax, facecolor='none', edgecolor='black', linewidth=2)
If you are interested in knowing only where the snow is, it is possible to use the snow_mask computed before. We can assign a value of 1 to all the pixels with snow, and 0 to the remaining ones.
snow_mask = xr.where(condition_snow_mask, 1, 0)
fig, ax = plt.subplots(figsize=(25,10))
snow_mask.plot(ax=ax, cmap='Blues_r')
raion_gdf.plot(ax=ax, facecolor='none', edgecolor='black', linewidth=2)
If we want to do some statistical analysis with the raster data combined with our shapefile, we can use the rasterstats module (see its documentation online). This module allows us to compute zonal statistics. For example:
# Convert all the snow pixels to 150
snow_mask = xr.where(condition_snow_mask, 150, ds.snow_cover)
# Convert all the no_snow pixels to 0, leaving the other values unchanged
snow_mask = xr.where(snow_mask < 40, 0, snow_mask)
# Zonal statistic from rasterstats
results = rasterstats.zonal_stats(raion_gdf, snow_mask.values, affine=ds.snow_cover.affine,
                                  nodata=255, stats='count', categorical=True)
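Before converting to a DataFrame, it can be useful to inspect what rasterstats returns: a list with one dictionary per polygon, whose keys are the pixel categories found plus the requested statistics. For example:
# Inspect the zonal statistics for the first raion
print(results[0])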
We copy all the results into a pandas DataFrame:
df = pd.DataFrame(results)
df = df.fillna(0)
df
Now we have the count of the pixels for the different classes (the numbers in the header) and the total number of pixels in each Raion (count). Then we add the data that we want into the geopandas DataFrame:
# Percentage of snow pixels
raion_gdf['snow_percentage'] = df[150.0]/df['count']
# Number of snow pixels
raion_gdf['n_snowpix'] = df[150.0]
raion_gdf
We can now plot the results in a nice-looking map!
Percentage of snow by Raion:
# set up the plot
fig, ax = plt.subplots(1, 1)
# set the size of the plot
fig.set_size_inches(18,10)
# plot with more attributes
raion_gdf.plot(column='snow_percentage',
               ax=ax,
               cmap='Blues',
               vmin=0,
               vmax=1,
               edgecolor='black',
               legend=True,
               legend_kwds={'label': "Percentage of Snow by Raion",
                            'orientation': "horizontal"})
Number of pixels that contain snow by Raion:
# set up the plot
fig, ax = plt.subplots(1, 1)
# set the size of the plot
fig.set_size_inches(18,10)
# plot with more attributes
raion_gdf.plot(column='n_snowpix',
               ax=ax,
               cmap='Blues',
               edgecolor='black',
               legend=True,
               legend_kwds={'label': "Number of Snow pixels by Raion",
                            'orientation': "horizontal"})
Further analyses can be done using the snow cover.
In the following section we will look into snow persistence and snow percentage by pixel.
# Loading again the Raion shapefiles
raion_gdf = geopandas.read_file("data/kgz_admbnda_adm2_moes_20181119.shp", encoding='utf-8')
raion_utm_gdf = raion_gdf.to_crs('EPSG:32643')
Let's get all the MODIS data for December 2019
start_date = '2019-12-01'
end_date = '2019-12-31'
query = {'time': [start_date, end_date],
         'measurements': ['snow_cover'],
         'output_crs': 'EPSG:32643',
         'resolution': [-500, 500],
         'dask_chunks': {'time': 1}
         }
# Loading and merging data for MODIS
terra = dc.load(product='MOD10A1', **query)
aqua = dc.load(product='MYD10A1', **query)
data = xr.concat([aqua, terra], dim='time')
crs = data.crs
print(data)
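Note that concatenating the Aqua and Terra datasets leaves the time axis unsorted, since the two satellites' passages are interleaved. If chronological order matters for your analysis, you can sort it (an optional step):
# Sort the combined observations chronologically
data = data.sortby('time')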
Now we need to apply an NDSI limit to find our snow pixels.
# Find pixels that have 0.4 <= NDSI <= 1 (snow pixels)
condition = (data.snow_cover >= 40) & (data.snow_cover <= 100)
snow_cover = xr.where(condition, 1, 0)
# Find pixels that could not be classified (clouds included)
nodata = (data.snow_cover >= 250) | (data.snow_cover == 200) | (data.snow_cover == 201)
snow_cover = xr.where(nodata, np.nan, snow_cover)
# All the rasters will have 1 for snow, 0 for no_snow and NaN for no_data
print(snow_cover)
# Dimensions of the Data Array
snow_cover.shape
We group all the data by day, so we have a snow mask (snow/no_snow) for each day.
# Find the max values of snow_cover for each day. It will include all the snow pixels.
snow_cover = snow_cover.groupby('time.day').max()
print(snow_cover)
# Dimensions of the Data Array
snow_cover.shape
(The first dimension makes sense because there are 31 days in December.)
Now we can compute the snow persistence. This will tell us the maximum number of consecutive days with snow in a pixel.
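To see how the update rule in the loop below works, consider a single pixel: with p_new = (p_old + s) * s, the counter increases by one on a snow day (s = 1) and resets to zero otherwise. A tiny standalone illustration with made-up values:
# Made-up daily snow/no_snow sequence for one pixel
p = 0
for s in [1, 1, 0, 1, 1, 1]:
    p = (p + s) * s
    print(p)  # prints 1, 2, 0, 1, 2, 3 -> the longest run of snow days is 3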
# Save all the nodata values
nodata = snow_cover.isnull()
# Keep track of pixels that are nodata (night or cloud) for the whole period
mask_nan = (nodata.sum(dim='day') / snow_cover.day.size) == 1
# Initialise the xarrays (no value equals -1, so this gives an array of zeros)
snow_persistence = xr.where(snow_cover.isel(day=0) != -1, 0, 1)
snow_persistence_max = snow_persistence.copy()
# For loop to find the snow persistence
for i in range(snow_cover.day.size):
    # For nodata (night and cloud) conditions keep the existing value,
    # otherwise update the running count of consecutive snow days
    snow_persistence = xr.where(nodata.isel(day=i),
                                snow_persistence,
                                (snow_persistence + snow_cover.isel(day=i)) * snow_cover.isel(day=i))
    # Keep the element-wise maximum seen so far
    snow_persistence_max = np.fmax(snow_persistence, snow_persistence_max)
# Keep the NaN values for pixels that were always nodata
snow_persistence_max = xr.where(mask_nan, np.nan, snow_persistence_max).compute()
# Plot the max snow persistence observed in the chosen time period
snow_persistence_max.name = 'snow_persistence_max'
fig, ax = plt.subplots(figsize=(25,10))
snow_persistence_max.plot.imshow(ax=ax)
raion_utm_gdf.plot(ax=ax, facecolor='none', edgecolor='black', linewidth=2)
We can also compute the snow percentage, which tells us the number of days classified as snow over the number of valid observations (in this case, days).
First we count the invalid pixels, where a pixel could not be classified as either snow or no_snow, for example when it has been flagged as cloud, night, or missing data.
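As a quick worked example with made-up numbers: for a pixel with 31 daily observations, of which 10 are invalid and 15 are classified as snow, the snow percentage is 15 / (31 - 10) * 100 ≈ 71.4%.
# Quick check of the formula with the made-up numbers above
print(15 / (31 - 10) * 100)  # ≈ 71.43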
# To compute the percentage that a pixel has been a snow pixel, we need to remove the case
# when it has been detected as a nodata, night or cloud.
snow_count_valid = xr.where(nodata, 1, 0)
snow_count_sum = snow_count_valid.sum(dim='day')
print(snow_count_sum)
# Plot the number of nodata occurrences per pixel; at the edges it should equal snow_cover.day.size
snow_count_sum.name = 'number of occurrences for nodata'
fig, ax = plt.subplots(figsize=(25,10))
snow_count_sum.plot.imshow(ax=ax)
raion_utm_gdf.plot(ax=ax, facecolor='none', edgecolor='black', lw=2)
Now we can compute the snow percentage
# Compute the percentage that a pixel has been a snow pixel
snow_percentage = snow_cover.sum(dim='day') / (snow_cover.day.size - snow_count_sum) * 100.
# Plot the snow percentage in the chosen time period
snow_percentage.name = 'snow_percentage'
fig, ax = plt.subplots(figsize=(25,10))
snow_percentage.plot.imshow(ax=ax, vmax=100., vmin=0.)
raion_utm_gdf.plot(ax=ax, facecolor='none', edgecolor='black', lw=2)