import datetime
import sys
import geopandas
import numpy as np
import xarray as xr
import matplotlib.pyplot as plt
from datacube import Datacube
from rasterio.features import geometry_mask
sys.path.append('/eOsphere/bin')
import dcFunctions


# Open the data cube; no explicit configuration is passed.
dc = Datacube()

# Read the boundaries shapefile, decoding its attribute text as UTF-8.
sf = geopandas.read_file(
    'data/kgz_admbnda_adm2_moes_20181119.shp',
    encoding='utf-8',
)
# Bare expression kept from the notebook: it only displays the table in an
# interactive session and has no effect when run as a script.
sf


# Pick one Raion by its row label in the shapefile table
region_id = 15
# Bounding box (minx, miny, maxx, maxy) of the selected Raion, expressed in
# the shapefile's own coordinate system
minX, minY, maxX, maxY = sf.bounds.loc[region_id]

# Time window and load parameters for the NDVI request
start_date = '2019-06-21'
end_date = '2019-06-30'
query = dict(
    x=[minX, maxX],
    y=[minY, maxY],
    time=[start_date, end_date],
    measurements=['ndvi'],
    output_crs='EPSG:32643',
    # NOTE(review): the MODIS query later in this file uses a negative first
    # value ([-500, 500]); confirm that [10, 10] is intended here.
    resolution=[10, 10],
    dask_chunks={'time': 1, 'x': 1024, 'y': 1024},
)


# Load the 'indices' product with the parameters prepared above
ds = dc.load(product='indices', **query)

# Remember the grid description of the loaded data; the masking step below
# needs the CRS, the raster shape and the affine transform.
crs = ds.crs
shape_ds, affine_ds = ds.geobox.shape, ds.geobox.affine

print(ds)

# Keep only the first time slice and pass it through dcFunctions.scal_2_tru
# (presumably converts scaled stored values to true values -- confirm in
# dcFunctions).
ds = dcFunctions.scal_2_tru(ds.isel(time=0))


# Boundaries reprojected to EPSG:32643 so they can be drawn over the raster
sf_utm = sf.to_crs(epsg=32643)

# NDVI raster with every boundary outlined on top
fig, ax = plt.subplots()
ds['ndvi'].plot(ax=ax, cmap='RdYlGn')
sf_utm.plot(ax=ax, edgecolor='black', facecolor='none')


# Reproject the selected Raion to the CRS of the loaded data so that the
# polygon and the raster grid line up
gdf = sf.iloc[[region_id]].to_crs(crs)

# Rasterise the polygon onto the data grid and wrap the result as a (y, x)
# DataArray. With invert=False the mask is True for pixels that do not
# overlap the polygon.
mask = xr.DataArray(
    geometry_mask(
        gdf.geometry,
        out_shape=shape_ds,
        transform=affine_ds,
        all_touched=False,
        invert=False,
    ),
    dims=('y', 'x'),
)
# Keep values only where the mask is False; everything else becomes NaN
ds = ds.where(~mask)


# Draw the masked NDVI twice: first with every boundary outlined, then with
# only the selected Raion outlined.
for outline in (sf_utm, gdf):
    fig, ax = plt.subplots()
    ds['ndvi'].plot(ax=ax, cmap='RdYlGn')
    outline.plot(ax=ax, edgecolor='black', facecolor='none')


# Re-read the shapefile and take the extent that covers all of its geometries
sf = geopandas.read_file('data/kgz_admbnda_adm2_moes_20181119.shp')
minX, minY, maxX, maxY = (
    sf.bounds['minx'].min(),
    sf.bounds['miny'].min(),
    sf.bounds['maxx'].max(),
    sf.bounds['maxy'].max(),
)

# Query to load MODIS data
start_date = '2019-06-21'
end_date = '2019-06-30'
query = dict(
    x=[minX, maxX],
    y=[minY, maxY],
    time=[start_date, end_date],
    measurements=['red', 'green', 'blue'],
    output_crs='EPSG:32643',
    resolution=[-500, 500],
    dask_chunks={'time': 1, 'x': 1024, 'y': 1024},
)


# Load the 'modis_nbar' product with the parameters prepared above
ds = dc.load(product='modis_nbar', **query)

# Save some parameters for later on (used when rasterising the polygons)
crs = ds.crs
shape_ds, affine_ds = ds.geobox.shape, ds.geobox.affine
print(ds)

# In one chain: blank out the value 32767 (treated here as nodata), take the
# median over time for each band, materialise the result with compute(), and
# apply a square-root correction to the colours.
ds = (ds.where(ds != 32767).median(dim='time').compute()) ** 0.5
print(ds)

# RGB composite with every boundary outlined in red
fig, ax = plt.subplots(figsize=(15, 7))
ds[['red', 'green', 'blue']].to_array().plot.imshow(robust=True, ax=ax)
sf_utm.plot(ax=ax, edgecolor='red', facecolor='none')


# List all the raions that you want
region_ids = [15, 33]

# Select every requested raion in one go and reproject them together to the
# CRS of the loaded data, instead of reprojecting one row per loop iteration.
gdf = sf.iloc[region_ids].to_crs(crs)

# Rasterise all selected polygons in a single call. With invert=False the
# mask is True for pixels that overlap none of the polygons, which is the
# same result as AND-ing one mask per polygon.
mask = geometry_mask(
    gdf.geometry,
    out_shape=shape_ds,
    transform=affine_ds,
    all_touched=False,
    invert=False)

mask = xr.DataArray(mask, dims=('y', 'x'))
# Cropping our image: keep values inside any selected raion, NaN elsewhere
ds = ds.where(~mask)


# Cropped RGB composite with every boundary outlined in red
fig, ax = plt.subplots(figsize=(15, 7))
ds[['red', 'green', 'blue']].to_array().plot.imshow(robust=True, ax=ax)
sf_utm.plot(ax=ax, edgecolor='red', facecolor='none')


# Bare expression kept from the notebook: looks up the 'rgb' entry of the
# measurement table; the result is only displayed in an interactive session.
dc.list_measurements().loc['rgb']


# Re-read the shapefile and pick one raion by its row label
sf = geopandas.read_file('data/kgz_admbnda_adm2_moes_20181119.shp')
region_id = 15
# Bounding box (minx, miny, maxx, maxy) of the selected raion
minX, minY, maxX, maxY = sf.bounds.loc[region_id]

# Time window and load parameters for the RGB request
start_date = '2019-06-01'
end_date = '2019-06-30'
query = dict(
    x=[minX, maxX],
    y=[minY, maxY],
    time=[start_date, end_date],
    measurements=['red', 'green', 'blue'],
    output_crs='EPSG:32643',
    resolution=[10, 10],
    dask_chunks={'time': 1, 'x': 1024, 'y': 1024},
)


# Load the 'rgb' product with the parameters prepared above
ds = dc.load(product='rgb', **query)
print(ds)

# Reproject the selected raion to the CRS of the loaded data
crs = ds.crs
gdf = sf.iloc[[region_id]].to_crs(crs)

# Keep only the first time slice and pass it through dcFunctions.scal_2_tru
# (presumably converts scaled stored values to true values -- confirm in
# dcFunctions).
ds = dcFunctions.scal_2_tru(ds.isel(time=0))
print(ds)

# RGB composite with the selected raion outlined in red
fig, ax = plt.subplots(figsize=(15, 7))
ds[['red', 'green', 'blue']].to_array().plot.imshow(robust=True, ax=ax)
gdf.plot(ax=ax, edgecolor='red', facecolor='none')


import sys
import datacube
import numpy as np
import matplotlib.pyplot as plt
sys.path.append('/eOsphere/bin')
import dcFunctions


# Open the data cube; no explicit configuration is passed.
dc = datacube.Datacube()

# Small area of interest; no 'time' key is given, so the request is not
# restricted to a date range.
query = dict(
    x=[74.386, 74.391],
    y=[42.9, 42.91],
    measurements=['red', 'nir', 'mask'],
    output_crs='EPSG:32643',
    resolution=[10, 10],
)

# Load the 's2_10m' product and order the result along the time axis
ds = dc.load(product='s2_10m', **query).sortby('time')
print(ds)

# Keep only pixels whose 'mask' value is 5 or 7; everything else becomes NaN
# (the meaning of these two codes is defined by the product, not shown here).
ds = ds.where((ds['mask'] == 5) | (ds['mask'] == 7))

# Collapse the spatial dimensions to a single median value per time step
ds = ds.median(dim=['x', 'y'])
print(ds)


# Modified soil-adjusted vegetation index (MSAVI2 form) computed from the
# per-date median NIR and red values.
# NOTE(review): the "+ 1" term presumes reflectance on a 0-1 scale; other
# sections of this file pass data through dcFunctions.scal_2_tru first --
# confirm whether 's2_10m' values need the same treatment.
msavi = ((2 * ds.nir) + 1 - ((2 * ds.nir + 1)**2 - 8 * (ds.nir - ds.red))**0.5) / 2


# Draw on a dedicated figure/axes rather than pyplot's implicit "current"
# axes: when this file runs as a script the current axes would still be the
# RGB image from the previous section, and the points would land on top of it.
fig, ax = plt.subplots()
ax.scatter(ds.time, msavi, marker='.')


# Bounding box and year-long time window for the monthly index request
query = dict(
    x=[73.7128139, 77.9073308],
    y=[40.2809711, 42.4530034],
    time=['2019-01-01', '2019-12-31'],
    measurements=['ndvi', 'ndwi'],
    output_crs='EPSG:32643',
    resolution=[100, 100],
)

# Load the 'month_indices' product with the parameters above
ds = dc.load(product='month_indices', **query)
print(ds)

# Pass the data through dcFunctions.scal_2_tru (presumably converts scaled
# stored values to true values -- confirm in dcFunctions), then collapse the
# spatial dimensions to a single median value per time step.
ds = dcFunctions.scal_2_tru(ds).median(dim=['y', 'x'])
print(ds)


# One line per index on a shared axes, labelled with the upper-cased name
fig, ax = plt.subplots(1, 1, figsize=(8, 5))
for index_name in ('ndvi', 'ndwi'):
    ds[index_name].plot.line(ax=ax, label=index_name.upper())

ax.legend(loc='upper left')
plt.show()

# More Advanced Data Cube Usage

# Introduction to cropping products with shapefiles

# Let's look at the NDVI for this raion

# Let's cut the image using the shapefile

# Multiple polygons

# More Advanced Data Cube Usage

# Timeseries Analysis

# Finding average index values in Naryn for 2019