Lesson 2. Visualize NCEP's High-Resolution Rapid Refresh (HRRR) Temperature Data using Zarr¶
Objectives:
- Learn what Zarr is and its foundational principles
- Access archived NCEP HRRR data hosted on AWS S3 in Zarr format
- Visualize one of the variables (2m temperature) at a specific point in time
What is Zarr?¶
Zarr is an open-source specification and library for storing large, multi-dimensional typed arrays (tensors) in chunked, compressed formats, optimized for cloud object storage. It enables efficient parallel I/O, allowing concurrent reads and writes, making it ideal for large-scale scientific data analysis. Zarr is often described as a "cloud-native" alternative to older formats like HDF5.
Gridded datasets, especially those produced by operational meteorological centers such as NCEP and ECMWF, are typically in NetCDF and GRIB formats. Zarr is a relatively new data format. It is particularly relevant in the following two scenarios:
- Datasets that are stored in what's called an object store. This is a commonly used storage method for cloud providers, such as Amazon, Google, and Microsoft.
- Datasets that are typically too large to load into memory all at once.
Xarray supports the Zarr format in addition to NetCDF and GRIB. The Pangeo project specifically recommends Zarr as the Xarray-amenable data format of choice in the cloud.
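To make these ideas concrete, here is a minimal sketch using the zarr-python library (the shape and chunk sizes are arbitrary choices for illustration) that creates a chunked, compressed in-memory array and reads back a single chunk's worth of data:
import numpy as np
import zarr

# Create a chunked 2-D array; each 150 x 150 chunk is compressed independently
z = zarr.zeros((1059, 1799), chunks=(150, 150), dtype='f4')
z[:] = np.random.rand(1059, 1799)
# Slicing reads (and decompresses) only the chunks overlapping the request
subset = z[0:150, 0:150]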
How is data stored in Zarr?¶
Key features and details about Zarr include:
- Cloud-Native Design: Zarr is specifically designed to work efficiently with object stores like AWS S3, Google Cloud Storage, and Azure Blob Storage.
- Chunked Storage: Data is divided into smaller chunks, allowing only necessary portions to be loaded into memory, which improves performance for large datasets.
- Compression: Chunks are individually compressed, optimizing storage space.
- Interoperability: It is used across various languages, including Python, Julia, Java, C++, and Rust.
- Structure: It uses a directory-like hierarchy to store metadata (in JSON) and data (as binary files).
- Use Cases: It is widely used for high-dimensional scientific data, such as neuroimaging, climate science, and bioimaging.
Data Organization¶
The Zarr data specification organizes data as a hierarchical structure that mirrors the shape and organization of your arrays. Here’s a quick breakdown of how the data is stored (based on the Zarr V3 storage specification):
Zarr separates where data is stored from how it’s organized, using two key concepts: stores and groups.
A Store is the backend that defines where the data physically lives. A Zarr store can be:
- A directory on disk (e.g., LocalStore)
- A cloud bucket (e.g., FsspecStore for s3://…)
- An in-memory dictionary (e.g., MemoryStore)
- A custom system like Icechunk (covered below)
A Group is a logical container for organizing data, like folders in a file system.
- A group can contain multiple related Zarr arrays
- It can also hold other groups (nested hierarchy)
- Each group has its own metadata (in zarr.json)
- Groups live within a store
If you want to read more details, please refer to this blog post by Earthmover.
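As a small illustration of stores and groups, here is a sketch using the zarr-python version 3 API (the store path and array name are arbitrary; under version 2 the local store class is DirectoryStore instead):
import zarr

# A store defines where the bytes physically live; here, a directory on disk
store = zarr.storage.LocalStore('example.zarr')
# A group organizes arrays (and other groups) within the store
root = zarr.group(store=store)
tmp = root.create_array('TMP', shape=(1059, 1799), chunks=(150, 150), dtype='f4')
# On disk this yields zarr.json metadata files plus binary chunk files, e.g.:
# example.zarr/zarr.json
# example.zarr/TMP/zarr.json
# example.zarr/TMP/c/0/0   (one file per chunk)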
Step 1. Load the necessary libraries¶
import xarray as xr
import numpy as np
import matplotlib.pyplot as plt
import cartopy.crs as ccrs
import cartopy.feature as cfeature
import pandas as pd
import s3fs
import metpy
from importlib.metadata import version
import warnings  # don't print warnings
warnings.filterwarnings('ignore')
Step 2. Access archived NCEP HRRR data hosted on AWS in Zarr format¶
For a number of years, the Mesowest group at the University of Utah has hosted an archive of data from NCEP's High-Resolution Rapid Refresh model. This data, originally in GRIB-2 format, has been converted into Zarr and is freely available "in the cloud" on Amazon Web Services' Simple Storage Service, otherwise known as S3. Data is stored in S3 in a manner akin to (but different from) a Linux filesystem, using a bucket and object model.
To interactively browse the contents of this archive, go to this link: HRRRZarr File Browser on AWS
To access Zarr-formatted data stored in an S3 bucket, we follow a 3-step process:
- Create URL(s) pointing to the bucket and object(s) that contain the data we want
- Create map(s) to the object(s) with the s3fs library's S3Map method
- Pass the map(s) to Xarray's open_dataset or open_mfdataset methods, and specify zarr as the format, via the engine argument.
In this archive, each variable's data array and its accompanying metadata sit in two separate directories, so we will use the open_mfdataset method and pass in two AWS S3 file references to these two corresponding directories.
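The generic pattern looks like this (a sketch with a placeholder bucket path, assuming zarr-python version 2; the version-dependent code for this lesson follows below):
import s3fs
import xarray as xr

# Connect to S3 anonymously and wrap the Zarr store in a mapping Xarray can read
fs = s3fs.S3FileSystem(anon=True)
mapper = s3fs.S3Map('s3://some-bucket/path/to/store.zarr', s3=fs)
ds = xr.open_dataset(mapper, engine='zarr')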
Create the URLs
date = '20210214'
hour = '12'
var = 'TMP'
level = '2m_above_ground'
url1 = 's3://hrrrzarr/sfc/' + date + '/' + date + '_' + hour + 'z_anl.zarr/' + level + '/' + var + '/' + level
url2 = 's3://hrrrzarr/sfc/' + date + '/' + date + '_' + hour + 'z_anl.zarr/' + level + '/' + var
Connect to the S3 object store. With the release of Zarr version 3, the methods to do this have changed from version 2 (see, e.g., Zarr issues 2706 and 2748). Test which version is installed and use the appropriate methodology.
package = "zarr"
package_version = version(package)
major_version = int(package_version.split(".")[0]) # Extract the major version
if major_version == 3:
import zarr
# strip leading 's3://' from url
url1_3 = url1[5:]
url2_3 = url2[5:]
fs = s3fs.S3FileSystem(anon=True, asynchronous=True)
file1 = zarr.storage.FsspecStore(fs, path=url1_3)
file2 = zarr.storage.FsspecStore(fs, path=url2_3)
else:
fs = s3fs.S3FileSystem(anon=True, asynchronous=False)
file1 = s3fs.S3Map(url1, s3=fs)
file2 = s3fs.S3Map(url2, s3=fs)
Use Xarray's open_mfdataset to create a Dataset from these two S3 objects.
ds = xr.open_mfdataset([file1,file2], engine='zarr')
Examine the dataset.
ds
<xarray.Dataset> Size: 4MB
Dimensions: (projection_y_coordinate: 1059,
projection_x_coordinate: 1799)
Coordinates:
* projection_y_coordinate (projection_y_coordinate) float64 8kB -1.587e+06...
* projection_x_coordinate (projection_x_coordinate) float64 14kB -2.698e+0...
Data variables:
TMP (projection_y_coordinate, projection_x_coordinate) float16 4MB dask.array<chunksize=(150, 150), meta=np.ndarray>
forecast_period timedelta64[ns] 8B ...
forecast_reference_time datetime64[ns] 8B ...
height float64 8B ...
pressure float64 8B ...
time datetime64[ns] 8B ...
Get the map projection for the HRRR, which is stored in the grid folder in the AWS bucket.
HRRR_proj = pd.read_json("https://hrrrzarr.s3.amazonaws.com/grid/projparams.json", orient="index")
HRRR_proj
|  | 0 |
|---|---|
| a | 6371229 |
| b | 6371229 |
| proj | lcc |
| lon_0 | 262.5 |
| lat_0 | 38.5 |
| lat_1 | 38.5 |
| lat_2 | 38.5 |
lat_0 = HRRR_proj.loc['lat_0'].astype('float32').squeeze()
lat_1 = HRRR_proj.loc['lat_1'].astype('float32').squeeze()
lat_2 = HRRR_proj.loc['lat_2'].astype('float32').squeeze()
lon_0 = HRRR_proj.loc['lon_0'].astype('float32').squeeze()
a = HRRR_proj.loc['a'].astype('float32').squeeze()
b = HRRR_proj.loc['b'].astype('float32').squeeze()
projData = ccrs.LambertConformal(central_longitude=lon_0, central_latitude=lat_0,
                                 standard_parallels=[lat_1, lat_2],
                                 globe=ccrs.Globe(semimajor_axis=a, semiminor_axis=b))
The HRRR's projection assumes a spherical earth (the semi-major and semi-minor axes are equal), so we define a custom Globe in Cartopy with these values.
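As a quick sanity check (a hypothetical example; the point chosen is arbitrary), we can transform a longitude/latitude pair into the projection's x/y coordinates:
# Transform a lon/lat point (here, near Denver, CO) into HRRR grid coordinates (meters)
xpt, ypt = projData.transform_point(-105.0, 40.0, ccrs.PlateCarree())
print(xpt, ypt)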
Examine the dataset's coordinate variables. Each x- and y- value represents distance in meters from the central latitude and longitude.
ds.coords
Coordinates: * projection_y_coordinate (projection_y_coordinate) float64 8kB -1.587e+06... * projection_x_coordinate (projection_x_coordinate) float64 14kB -2.698e+0...
Create an object pointing to the dataset's data variable.
airTemp = ds.TMP
When we examine the object, we see that it is a special type of DataArray ... one whose values are stored as a Dask array.
airTemp
<xarray.DataArray 'TMP' (projection_y_coordinate: 1059,
projection_x_coordinate: 1799)> Size: 4MB
dask.array<open_dataset-TMP, shape=(1059, 1799), dtype=float16, chunksize=(150, 150), chunktype=numpy.ndarray>
Coordinates:
* projection_y_coordinate (projection_y_coordinate) float64 8kB -1.587e+06...
* projection_x_coordinate (projection_x_coordinate) float64 14kB -2.698e+0...
Attributes:
GRIB_PARAM: [2, 0, 0, 0]
long_name: 2m_above_ground/TMP
units: K
Sidetrip: The Dask library¶
Because we used open_mfdataset, the resulting objects are Dask objects: their data is split into chunks and is not read into memory until a computation actually requires it.
MetPy supports Dask arrays, and so performing a unit conversion is straightforward.
airTemp = airTemp.metpy.convert_units('degC')
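If MetPy were not available, a manual conversion would be a simple alternative (a sketch: we subtract the Kelvin offset ourselves and set the units attribute by hand):
# Manual Kelvin-to-Celsius conversion (alternative to MetPy's convert_units)
airTemp_manual = ds.TMP - 273.15
airTemp_manual.attrs['units'] = 'degC'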
Verify that airTemp reflects the unit change.
airTemp
<xarray.DataArray 'TMP' (projection_y_coordinate: 1059,
projection_x_coordinate: 1799)> Size: 4MB
<Quantity(dask.array<truediv, shape=(1059, 1799), dtype=float16, chunksize=(150, 150), chunktype=numpy.ndarray>, 'degree_Celsius')>
Coordinates:
* projection_y_coordinate (projection_y_coordinate) float64 8kB -1.587e+06...
* projection_x_coordinate (projection_x_coordinate) float64 14kB -2.698e+0...
Attributes:
GRIB_PARAM: [2, 0, 0, 0]
long_name: 2m_above_ground/TMP
Similar to what we did for datasets whose projection-related coordinates were latitude and longitude, we define objects pointing to x and y now, so we can pass them to the plotting functions.
x = airTemp.projection_x_coordinate
y = airTemp.projection_y_coordinate
Step 3. Visualize 2m temperatures at a given point in time¶
First, just use Xarray's plot function to get a quick look to verify that things look right.
airTemp.plot(figsize=(11,8.5))
<matplotlib.collections.QuadMesh at 0x7f8e55e44110>
To set the bounds of the contour intervals, obtain the min and max values from this DataArray. Recall that TMP is a Dask-backed DataArray in Xarray. If we want to perform a computation on this array, e.g. calculate the mean, min, or max, note that we don't get a result straightaway ... we get another Dask array.
airTemp.min()
<xarray.DataArray 'TMP' ()> Size: 2B
<Quantity(dask.array<_nanmin_skip-aggregate, shape=(), dtype=float16, chunksize=(), chunktype=numpy.ndarray>, 'degree_Celsius')>
Attributes:
GRIB_PARAM: [2, 0, 0, 0]
long_name: 2m_above_ground/TMP
We need to invoke the compute function to actually trigger the computation.
minTemp = airTemp.min().compute()
maxTemp = airTemp.max().compute()
minTemp.values, maxTemp.values
(array(-42.38, dtype=float16), array(26., dtype=float16))
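As a side note, the two reductions can also be evaluated together in a single call (a sketch, assuming the dask library is importable directly), which lets Dask share the underlying chunk reads:
import dask

# Evaluate both lazy reductions at once
minTemp, maxTemp = dask.compute(airTemp.min(), airTemp.max())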
Based on the min and max, define a range of values used for contouring. Let's invoke NumPy's floor and ceil(ing) functions so the contour range adapts to whatever variable we are contouring.
fint = np.arange(np.floor(minTemp.values), np.ceil(maxTemp.values) + 2, 2)
fint
array([-43., -41., -39., -37., -35., -33., -31., -29., -27., -25., -23.,
-21., -19., -17., -15., -13., -11., -9., -7., -5., -3., -1.,
1., 3., 5., 7., 9., 11., 13., 15., 17., 19., 21.,
23., 25., 27.])
Step 4. Plot a map of temperatures¶
We'll define the plot extent to nicely encompass the HRRR's spatial domain.
latN = 50.4
latS = 24.25
lonW = -123.8
lonE = -71.2
res = '50m'
fig = plt.figure(figsize=(18, 12))
ax = fig.add_subplot(1, 1, 1, projection=projData)
ax.set_extent([lonW, lonE, latS, latN], crs=ccrs.PlateCarree())
ax.add_feature(cfeature.COASTLINE.with_scale(res))
ax.add_feature(cfeature.STATES.with_scale(res))
# Add the title
tl1 = 'HRRR 2m temperature (°C)'
tl2 = f'Analysis valid at: {hour}00 UTC {date}'
ax.set_title(f'{tl1}\n{tl2}', fontsize=16)
# Contour fill
CF = ax.contourf(x, y, airTemp, levels=fint, cmap=plt.get_cmap('coolwarm'))
# Make a colorbar for the ContourSet returned by the contourf call.
cbar = fig.colorbar(CF, shrink=0.5)
cbar.set_label('2m Temperature (°C)', size='large')
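The same projection machinery also lets us sample the field at a single point (a hypothetical example; the location is arbitrary) by transforming a lon/lat pair into grid coordinates and selecting the nearest cell:
# Sample the 2m temperature nearest to a chosen point (here, Denver, CO)
lon, lat = -104.99, 39.74
xpt, ypt = projData.transform_point(lon, lat, ccrs.PlateCarree())
point_temp = airTemp.sel(projection_x_coordinate=xpt,
                         projection_y_coordinate=ypt, method='nearest').compute()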
Conclusions¶
We've demonstrated the following concepts in this workbook:
- Use Zarr to efficiently store chunked, multidimensional gridded spatial data
- Access and load archived NCEP HRRR data hosted on AWS in Zarr format from a cloud-based object store system such as AWS S3
- A quick side trip on using Dask as a way to efficiently split operations on chunked data
- Visualize HRRR temperature data and plot maps
Additional Resources¶
- HRRR in Zarr format
- NCEP's HRRR S3 archive (GRIB format)
- What is object store?
- Xarray's Dask implementation
- AWS Skill Builder: This training portal provided by AWS contains self-paced training modules for all of AWS' cloud storage and compute services. While some of the courses are behind a paywall, many of the introductory courses are free to access. Use the web application's filtering function to focus your search, for example to Free courses at the Fundamental skill level focused on Data analytics.