Patrick Gray (patrick.c.gray at duke) - https://github.com/patrickcgray
In many cases in the earth sciences you will be working with remote sensing data that has dense time series and is highly dimensional (e.g. lat x lon x time x measurements). Working with this data as a plain numpy array is often clunky and error prone, and keeping the data in a labeled format with its metadata attached can prevent many of the mistakes a data scientist might make. Additionally, many of these datasets are so large that they cannot effectively fit in memory or should be processed in parallel. Here we'll introduce xarray, which effectively resolves nearly all of these challenges. From the documentation:
Multi-dimensional (a.k.a. N-dimensional, ND) arrays (sometimes called “tensors”) are an essential part of computational science. They are encountered in a wide range of fields, including physics, astronomy, geoscience, bioinformatics, engineering, finance, and deep learning. In Python, NumPy provides the fundamental data structure and API for working with raw ND arrays. However, real-world datasets are usually more than just raw numbers; they have labels which encode information about how the array values map to locations in space, time, etc.
Xarray introduces labels in the form of dimensions, coordinates and attributes on top of raw NumPy-like multidimensional arrays, which allows for a more intuitive, more concise, and less error-prone developer experience.
Xarray is inspired by and borrows heavily from pandas, the popular data analysis package focused on labeled tabular data. It is particularly tailored to working with netCDF files, which were the source of xarray’s data model, and integrates tightly with dask for parallel computing.
One of the other exciting aspects of xarray is the ability to use cloud-based data directly off the web, downloading and processing it only as needed.
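To make the lazy, load-on-demand model concrete before we touch real cloud data, here is a minimal sketch using a synthetic in-memory array chunked with dask (the shapes and values are made up; a remote OPeNDAP or cloud dataset behaves analogously, with bytes only transferred when values are actually needed):

```python
import numpy as np
import xarray as xr

# Build a labeled 3-D array (time x lat x lon); chunking it with dask
# makes downstream operations lazy, so reductions build a task graph
# instead of computing immediately.
da = xr.DataArray(
    np.arange(10 * 4 * 5, dtype=float).reshape(10, 4, 5),
    dims=["time", "lat", "lon"],
).chunk({"time": 5})

lazy_mean = da.mean(dim="time")  # builds a dask task graph; nothing computed yet
result = lazy_mean.compute()     # the computation actually runs here
print(result.shape)              # (4, 5)
```

With a remote dataset the same pattern applies: opening and subsetting are cheap, and only the final `.compute()` (or a plot) triggers data transfer.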
In this chapter we'll be using xarray to process ocean color data from the Ocean Colour Climate Change Initiative project (https://www.oceancolour.org/) over the northern Atlantic Ocean. We'll also be leveraging holoviews and geoviews via the high level plotting API hvplot. Holoviews is an impressively powerful python library for interactive visualization. Geoviews "is a Python library that makes it easy to explore and visualize geographical, meteorological, and oceanographic datasets, such as those used in weather, climate, and remote sensing research." And hvplot is a high level API that provides a consistent and simple interface for using holoviews and geoviews when plotting any of its supported data types (e.g. pandas DataFrames, xarray Datasets, dask DataFrames, GeoPandas GeoDataFrames, and much more).
%matplotlib inline
import netCDF4
import matplotlib.pyplot as plt
# numpy
import numpy as np
import dask
# xarray (very handy)
import xarray as xr
import rasterio
# http://geo.holoviews.org/index.html
import holoviews as hv
import geoviews as gv
import geoviews.feature as gf
import warnings
import sys
gv.extension('bokeh')
da = xr.DataArray([9, 0, 2, 1, 0])
da
<xarray.DataArray (dim_0: 5)> array([9, 0, 2, 1, 0]) Dimensions without coordinates: dim_0
da = xr.DataArray([9, 0, 2, 1, 0], dims=['x'])
da
<xarray.DataArray (x: 5)> array([9, 0, 2, 1, 0]) Dimensions without coordinates: x
da = xr.DataArray([9, 0, 2, 1, 0],
dims=['x'],
coords={'x': [10, 20, 30, 40, 50]})
da
<xarray.DataArray (x: 5)> array([9, 0, 2, 1, 0]) Coordinates: * x (x) int64 10 20 30 40 50
da.plot(marker='o')
[<matplotlib.lines.Line2D at 0x7fd601891f10>]
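The payoff of attaching those coordinate labels is label-based indexing: you select data by meaningful values instead of integer positions. A quick sketch using the same small DataArray we just built:

```python
import xarray as xr

da = xr.DataArray([9, 0, 2, 1, 0],
                  dims=['x'],
                  coords={'x': [10, 20, 30, 40, 50]})

# Select by coordinate label rather than by integer position
print(da.sel(x=30).item())             # 2
# Positional indexing is still available via isel
print(da.isel(x=2).item())             # 2
# Label-based slices include both endpoints
print(da.sel(x=slice(20, 40)).values)  # [0 2 1]
```

This is exactly the machinery we'll rely on below when slicing the ocean color dataset by latitude and longitude.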
We'll just have xarray pull the data in directly from the cloud using OPeNDAP. We're getting this data from the Ocean Colour Climate Change Initiative project (https://www.oceancolour.org/), which compiles a global merged chlorophyll-a product.
This dataset can be easily opened from an OPeNDAP link using the xarray open_dataset() function, though it may take a minute or two:
chla_ds = xr.open_dataset('https://www.oceancolour.org/thredds/dodsC/CCI_ALL-v5.0-5DAY?lat[1000:1:1550],lon[2350:1:2750],time[1450:1:1650],chlor_a[1450:1:1650][1000:1:1550][2350:1:2750]')
chla_ds
<xarray.Dataset> Dimensions: (lat: 551, lon: 401, time: 201) Coordinates: * lat (lat) float64 48.31 48.27 48.23 48.19 ... 25.52 25.48 25.44 25.4 * lon (lon) float64 -82.06 -82.02 -81.98 -81.94 ... -65.48 -65.44 -65.4 * time (time) datetime64[ns] 2017-06-25 2017-06-30 ... 2020-03-21 Data variables: chlor_a (time, lat, lon) float32 ... Attributes: (12/50) _NCProperties: version=1|netcdflibversion=4.4.1.1|hdf... Conventions: CF-1.7 Metadata_Conventions: Unidata Dataset Discovery v1.0 cdm_data_type: Grid comment: See summary attribute creator_email: help@esa-oceancolour-cci.org ... ... time_coverage_resolution: P5D time_coverage_duration: P5D start_date: 26-DEC-2020 00:00:00.000000 stop_date: 30-DEC-2020 23:59:00.000000 time_coverage_start: 202012260000Z time_coverage_end: 202012302359Z
This dataset is a bit larger than we want, so we'll subset it to an area of interest using the .sel() function with slice(), which lets the user simply specify the lat and lon bounds they want (note the lat slice runs from 44 down to 26 because the lat coordinate is in descending order):
chla_ds = chla_ds.sel(lat=slice(44,26),lon=slice(-82,-66))
chla_ds
<xarray.Dataset> Dimensions: (lat: 432, lon: 384, time: 201) Coordinates: * lat (lat) float64 43.98 43.94 43.9 43.85 ... 26.15 26.1 26.06 26.02 * lon (lon) float64 -81.98 -81.94 -81.9 -81.85 ... -66.1 -66.06 -66.02 * time (time) datetime64[ns] 2017-06-25 2017-06-30 ... 2020-03-21 Data variables: chlor_a (time, lat, lon) float32 ... Attributes: (12/50) _NCProperties: version=1|netcdflibversion=4.4.1.1|hdf... Conventions: CF-1.7 Metadata_Conventions: Unidata Dataset Discovery v1.0 cdm_data_type: Grid comment: See summary attribute creator_email: help@esa-oceancolour-cci.org ... ... time_coverage_resolution: P5D time_coverage_duration: P5D start_date: 26-DEC-2020 00:00:00.000000 stop_date: 30-DEC-2020 23:59:00.000000 time_coverage_start: 202012260000Z time_coverage_end: 202012302359Z
The main data variable is chlor_a, which we access as an attribute of the dataset object:
chla_ds.chlor_a.isel(time=1).plot()
<matplotlib.collections.QuadMesh at 0x7fd608afa820>
Note how it usefully auto-labels the axes in the plot. We can use normal matplotlib syntax to modify this plot to be a bit more visually appealing.
from matplotlib.colors import LogNorm
fig,ax = plt.subplots(figsize=(12,8))
chla_ds = chla_ds.sel(lat=slice(44,26),lon=slice(-82,-66))
chla_ds.chlor_a.isel(time=1).plot(ax=ax, cmap='jet', norm=LogNorm(vmin=0.01, vmax=10))
#ax.set_ylim(ax.get_ylim()[::-1])
plt.show()
How about if we average along the longitude and time dimensions to show the mean chl-a across latitudes? We'll also select a time subset to make this go faster.
chla_ds.chlor_a.isel(time=slice(30,50)).mean(dim=('lon', 'time')).plot()
[<matplotlib.lines.Line2D at 0x7fd6016b0880>]
If you want to know what times we just averaged you can see them here:
chla_ds.chlor_a.isel(time=slice(30,50)).time
<xarray.DataArray 'time' (time: 20)> array(['2017-11-22T00:00:00.000000000', '2017-11-27T00:00:00.000000000', '2017-12-02T00:00:00.000000000', '2017-12-07T00:00:00.000000000', '2017-12-12T00:00:00.000000000', '2017-12-17T00:00:00.000000000', '2017-12-22T00:00:00.000000000', '2017-12-27T00:00:00.000000000', '2018-01-01T00:00:00.000000000', '2018-01-06T00:00:00.000000000', '2018-01-11T00:00:00.000000000', '2018-01-16T00:00:00.000000000', '2018-01-21T00:00:00.000000000', '2018-01-26T00:00:00.000000000', '2018-01-31T00:00:00.000000000', '2018-02-05T00:00:00.000000000', '2018-02-10T00:00:00.000000000', '2018-02-15T00:00:00.000000000', '2018-02-20T00:00:00.000000000', '2018-02-25T00:00:00.000000000'], dtype='datetime64[ns]') Coordinates: * time (time) datetime64[ns] 2017-11-22 2017-11-27 ... 2018-02-25 Attributes: axis: T standard_name: time _ChunkSizes: 1
This gives a little glimpse of how easy it is to handle complex datasets with xarray.
Let's look at the chl-a across time and longitude, averaged for the latitude range of 34-35. This is effectively off Cape Hatteras and out into the ocean.
chla_ds.chlor_a.sel(lat=slice(35,34.5)).mean(dim=('lat'), skipna=True).plot( cmap='jet', norm=LogNorm(vmin=0.01, vmax=10))
<matplotlib.collections.QuadMesh at 0x7fd60166dd90>
Now this is really cool! We can see intense seasonality both out in the open ocean and along the coast, with the most productivity in the winter in both regions.
Let's take the average chla in two different regions, one north and one south of the Gulf Stream, and look at them across time. First let's see where the two regions are spatially:
import matplotlib.patches as patches
fig,ax = plt.subplots(figsize=(12,8))
chla_ds = chla_ds.sel(lat=slice(44,26),lon=slice(-82,-66))
chla_ds.chlor_a.isel(time=1).plot(ax=ax, cmap='jet', norm=LogNorm(vmin=0.01, vmax=10))
rect = patches.Rectangle((-71, 33), 1, 1, linewidth=1, edgecolor='black', facecolor='b', alpha=0.5)
ax.add_patch(rect)
rect = patches.Rectangle((-71, 39), 1, 1, linewidth=1, edgecolor='black', facecolor='g', alpha=0.5)
ax.add_patch(rect)
#ax.set_ylim(ax.get_ylim()[::-1])
plt.show()
Now let's select them and plot them across time:
fig,ax = plt.subplots()
chla_ds.chlor_a.sel(lat=slice(33,32), lon=slice(-71,-70)).mean(dim=('lat', 'lon')).plot(ax=ax, color='blue')
chla_ds.chlor_a.sel(lat=slice(39,38), lon=slice(-71,-70)).mean(dim=('lat', 'lon')).plot(ax=ax, color='green')
plt.show()
As expected, the region north of the Gulf Stream, with more access to nutrients, has much more chl-a and a more intense spring bloom.
As a final step before going into interactive visualizations, check out how easy it is to resample the dataset temporally. Let's make it a monthly dataset instead of 5-day time steps:
chla_ds_monthly = chla_ds.chlor_a.resample(time="1M").mean()
fig,ax = plt.subplots()
chla_ds_monthly.sel(lat=slice(33,32), lon=slice(-71,-70)).mean(dim=('lat', 'lon')).plot(ax=ax, color='blue')
chla_ds_monthly.sel(lat=slice(39,38), lon=slice(-71,-70)).mean(dim=('lat', 'lon')).plot(ax=ax, color='green')
plt.show()
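A close cousin of resample is groupby, which aggregates by a calendar component rather than by contiguous windows, e.g. a monthly climatology that pools all Januaries together. A small sketch with a synthetic time series (the values here are made up, not ocean color data):

```python
import numpy as np
import pandas as pd
import xarray as xr

# Two years of made-up daily values
times = pd.date_range("2019-01-01", "2020-12-31", freq="D")
da = xr.DataArray(np.arange(len(times), dtype=float),
                  dims=["time"], coords={"time": times})

# Average all values sharing the same calendar month across both years
climatology = da.groupby("time.month").mean()
print(climatology.sizes["month"])  # 12
```

Applied to chlor_a, the same one-liner would give the average seasonal cycle across the full record, a handy complement to the monthly resample above.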
Let's pull in hvplot and see what it can do
import hvplot
import hvplot.pandas
import hvplot.xarray
import cartopy.crs as crs
Let's make a similar plot to the one above where we selected the first time step but now let's make it interactive and with the ability to step through each time point. We'll also download the coastline and add that to the plot.
Play around with the buttons on the left that allow you to zoom, save as an image, and move around the plot.
proj = crs.Orthographic(-90, 30)
chla_ds.chlor_a.hvplot.quadmesh(
'lon', 'lat', projection=proj, project=True,
cmap='jet', dynamic=True, coastline='10m',
frame_width=500, logz=True, clim=(0.01,20), rasterize=True)
Now let's look at chl-a averaged for a subset of our time series and plotted spatially. Again play with the zooming and panning tools.
chla_ds.chlor_a.isel(time=slice(0,40)).mean(dim='time').hvplot(x="lon", y="lat", width=500, height=300, cmap='jet', logz=True, clim=(0.01,20), rasterize=True)
Hopefully you're beginning to see how powerful this interactivity can be for exploring a dataset.
Pretty amazing already, and while it is relatively clear in this oceanographic dataset, it would be useful to have a better idea of where we are in the world!
We'll pull in cartopy and geoviews.feature to give us projections and global features respectively. Explore options at https://scitools.org.uk/cartopy/docs/v0.15/crs/projections.html and http://geoviews.org/user_guide/Geometries.html.
import geoviews.feature as gf
# the * operator allows you to add multiple datasets to the same plot
# you can also use the + operator to add multiple plots to the same overall figure
gf.ocean * \
gf.land * \
chla_ds.chlor_a.isel(time=slice(0,40)).mean(dim='time').hvplot(x="lon", y="lat", width=500, height=300, cmap='jet', logz=True, clim=(0.01,20), global_extent=True, projection=proj) *\
gf.coastline * \
gf.borders
Now we're actually getting into some informative plotting, edging into cartography, and many of these tools are incredibly useful for analyzing remote sensing data. And that ends our series, congrats on making it through the whole thing, and please add an issue on GitHub if you have any problems or suggestions for additions!