合并具有相同范围但不同空间分辨率的xarray数据集

import netCDF4
import numpy as np
import dask
import xarray as xr

# Corner points of the study-area bounding box, one (lon, lat) pair per row.
rainy_bbox = np.array([
    [-69.29519955115512, -13.861261028444734],
    [-69.29519955115512, -12.384786628185896],
    [-71.19583431678012, -12.384786628185896],
    [-71.19583431678012, -13.861261028444734],
])
# Column-wise extremes: index 0 is used as lon and index 1 as lat below.
max_lon_lat = np.max(rainy_bbox, axis=0)
min_lon_lat = np.min(rainy_bbox, axis=0)

# this dataset is available here: ftp://fluo.gps.caltech.edu/data/tropomi/gridded/
sif = xr.open_dataset('../data/TROPO_SIF_03-2018.nc')

# the dataset is global so subset to my study area in the Amazon
rainy_sif_xds = sif.sel(
    lon=slice(min_lon_lat[0], max_lon_lat[0]),
    lat=slice(min_lon_lat[1], max_lon_lat[1]),
)

# this data can all be downloaded from NASA Goddard here either manually or
# with wget but you'll need an account on https://disc.gsfc.nasa.gov/:
# https://pastebin.com/viZckVdn
imerg_xds = xr.open_mfdataset('../data/3B-DAY.MS.MRG.3IMERG.201803*.nc4')

# spatial subset
rainy_imerg_xds = imerg_xds.sel(
    lon=slice(min_lon_lat[0], max_lon_lat[0]),
    lat=slice(min_lon_lat[1], max_lon_lat[1]),
)

# I'm not sure the best way to combine these datasets but am trying this
# (the SIF subset is `rainy_sif_xds`; the name `rainy_xds` is never defined)
combo_xds = xr.combine_by_coords([rainy_imerg_xds, rainy_sif_xds])

1条回答

网友

1楼 · 发布于 2024-06-06 18:00:20

xarray 的这篇文档（documentation）简要概述了这个问题的解决方案。xarray 允许在多个维度上进行插值，并可以把另一个数据集的 x、y 坐标指定为输出坐标。因此在这种情况下，可以这样实现：

# Interpolation approach follows http://xarray.pydata.org/en/stable/interpolation.html
# Per the original author: interpolation can't be done across the chunked
# dimension, so the SIF subset is loaded fully into memory first.
rainy_sif_xds.load()

# Resample SIF onto the (higher resolution) IMERG lat/lon grid.
interp_rainy_sif_xds = rainy_sif_xds.interp(
    coords={
        "lat": rainy_imerg_xds["lat"],
        "lon": rainy_imerg_xds["lon"],
    }
)

# Visualize the result: time-mean dcSIF before and after interpolation,
# combined into one display with `+`.
# NOTE(review): the `.hvplot` accessor needs `import hvplot.xarray`, which this
# snippet does not show — confirm it is imported earlier.
quadmesh_opts = dict(cmap='jet', geo=True, rasterize=True, dynamic=False, width=450)
(
    rainy_sif_xds.dcSIF.mean(dim='time')
    .hvplot.quadmesh('lon', 'lat', **quadmesh_opts)
    .relabel('Initial')
    + interp_rainy_sif_xds.dcSIF.mean(dim='time')
    .hvplot.quadmesh('lon', 'lat', **quadmesh_opts)
    .relabel('Interpolated')
)

# The spatial coordinates now match, but per the original author the IMERG
# rainfall dataset uses a CFTimeIndex while the SIF dataset uses datetime,
# so the IMERG time index is converted to a datetime index before merging.
imerg_datetime_index = rainy_imerg_xds.indexes['time'].to_datetimeindex()
rainy_imerg_xds['time'] = imerg_datetime_index

# Merge the two datasets, keeping only coordinate values present in both.
merged_xds = xr.combine_by_coords(
    [rainy_imerg_xds, interp_rainy_sif_xds],
    coords=['lat', 'lon', 'time'],
    join="inner",
)

# Visualize the two variables together. SIF is multiplied by 30 because its
# values are so low compared with precipitation.
rolling_precip = merged_xds.HQprecipitation.rolling(time=7, center=True).sum()
scaled_sif = merged_xds.dcSIF.mean(dim=('lat', 'lon')) * 30
(
    rolling_precip.mean(dim=('lat', 'lon')).hvplot().relabel('Precip')
    * scaled_sif.hvplot().relabel('SIF')
)

相关问题更多 >

编程相关推荐

热门问题

热门文章