import pathlib

NetCDF handling

NetCDF-formatted files are much faster to read and write for large datasets. To make the most of this, ScmRun objects can read and write netCDF files.

import traceback
from tempfile import TemporaryDirectory

import numpy as np
import seaborn as sns
import xarray as xr

from scmdata.netcdf import nc_to_run
from scmdata.run import ScmRun, run_append

/home/docs/checkouts/readthedocs.org/user_builds/scmdata/checkouts/stable/src/scmdata/database/_database.py:9: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html
  import tqdm.autonotebook as tqdman

Helper bits and pieces

# Seeded generator, so the example data are the same on every run.
generator = np.random.default_rng(0)

# Temporary directory that receives the files written by this example.
temp_directory = TemporaryDirectory()
OUTPUT_DIR = pathlib.Path(temp_directory.name)
OUT_FNAME = OUTPUT_DIR.joinpath("out_runs.nc")

def new_timeseries(  # noqa: PLR0913
    n=100,
    count=1,
    model="example",
    scenario="ssp119",
    variable="Surface Temperature",
    unit="K",
    region="World",
    cls=ScmRun,
    **kwargs,
):
    """
    Build a set of random example timeseries

    An ``(n, count)`` array is drawn from the module-level ``generator``
    and row ``i`` is multiplied by ``i``. The rows are indexed by
    ``2000, 2001, ..., 2000 + n - 1`` and everything is handed to ``cls``.

    Parameters
    ----------
    n
        Number of rows (time points) to generate
    count
        Number of columns (timeseries) to generate
    model, scenario, variable, unit, region
        Values stored under the metadata columns of the same name
    cls
        Callable used to construct the result
    **kwargs
        Additional metadata columns, passed through unchanged

    Returns
    -------
        The result of ``cls(data, columns=..., index=...)``
    """
    metadata = dict(
        model=model,
        scenario=scenario,
        variable=variable,
        region=region,
        unit=unit,
    )
    metadata.update(kwargs)

    # Column vector 0..n-1, broadcast across all ``count`` columns
    row_scale = np.arange(n)[:, None]
    values = generator.random((n, count)) * row_scale
    years = np.arange(n) + 2000

    return cls(values, columns=metadata, index=years)

Let’s create an ScmRun which contains a few variables and a number of runs. Such a dataframe would be used to store the results from an ensemble of simple climate model runs.

# Ten runs, each carrying the same three variables with their own units.
runs = [
    new_timeseries(
        count=3,
        variable=[
            "Surface Temperature",
            "Atmospheric Concentrations|CO2",
            "Radiative Forcing",
        ],
        unit=["K", "ppm", "W/m^2"],
        run_id=member_id,
    )
    for member_id in range(10)
]

# Combine the individual runs into a single ScmRun and tag its origin.
runs = run_append(runs)
runs.metadata["source"] = "fake data"
runs

<ScmRun (timeseries: 30, timepoints: 100)>
Time:
	Start: 2000-01-01T00:00:00
	End: 2099-01-01T00:00:00
Meta:
	      model region  run_id scenario   unit                        variable
 example  World       0   ssp119      K             Surface Temperature
 example  World       0   ssp119    ppm  Atmospheric Concentrations|CO2
 example  World       0   ssp119  W/m^2               Radiative Forcing
 example  World       1   ssp119      K             Surface Temperature
 example  World       1   ssp119    ppm  Atmospheric Concentrations|CO2
 example  World       1   ssp119  W/m^2               Radiative Forcing
 example  World       2   ssp119      K             Surface Temperature
 example  World       2   ssp119    ppm  Atmospheric Concentrations|CO2
 example  World       2   ssp119  W/m^2               Radiative Forcing
 example  World       3   ssp119      K             Surface Temperature
example  World       3   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       3   ssp119  W/m^2               Radiative Forcing
example  World       4   ssp119      K             Surface Temperature
example  World       4   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       4   ssp119  W/m^2               Radiative Forcing
example  World       5   ssp119      K             Surface Temperature
example  World       5   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       5   ssp119  W/m^2               Radiative Forcing
example  World       6   ssp119      K             Surface Temperature
example  World       6   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       6   ssp119  W/m^2               Radiative Forcing
example  World       7   ssp119      K             Surface Temperature
example  World       7   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       7   ssp119  W/m^2               Radiative Forcing
example  World       8   ssp119      K             Surface Temperature
example  World       8   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       8   ssp119  W/m^2               Radiative Forcing
example  World       9   ssp119      K             Surface Temperature
example  World       9   ssp119    ppm  Atmospheric Concentrations|CO2
example  World       9   ssp119  W/m^2               Radiative Forcing

Reading/Writing to NetCDF4

Multi-dimensional data

scmdata can also handle data with more than one dimension. This can be especially helpful if you have output from a number of models (IAMs), scenarios, regions and runs.

# One three-variable run for every model / scenario / region / paraset_id
# combination, generated in that nesting order.
multi_dimensional_run = []

for model in ["AIM", "GCAM", "MESSAGE", "REMIND"]:
    for sce in ["ssp119", "ssp370", "ssp585"]:
        for region in ["World", "R5LAM", "R5MAF", "R5ASIA", "R5OECD", "R5REF"]:
            for paraset_id in range(10):
                multi_dimensional_run.append(
                    new_timeseries(
                        count=3,
                        model=model,
                        scenario=sce,
                        region=region,
                        variable=[
                            "Surface Temperature",
                            "Atmospheric Concentrations|CO2",
                            "Radiative Forcing",
                        ],
                        unit=["K", "ppm", "W/m^2"],
                        paraset_id=paraset_id,
                    )
                )

# Merge the collected runs into a single ScmRun and display it.
multi_dimensional_run = run_append(multi_dimensional_run)

multi_dimensional_run

<ScmRun (timeseries: 2160, timepoints: 100)>
Time:
	Start: 2000-01-01T00:00:00
	End: 2099-01-01T00:00:00
Meta:
	       model  paraset_id region scenario   unit  \
	0        AIM           0  World   ssp119      K   
	1        AIM           0  World   ssp119    ppm   
	2        AIM           0  World   ssp119  W/m^2   
	3        AIM           1  World   ssp119      K   
	4        AIM           1  World   ssp119    ppm   
	...      ...         ...    ...      ...    ...   
	2155  REMIND           8  R5REF   ssp585    ppm   
	2156  REMIND           8  R5REF   ssp585  W/m^2   
	2157  REMIND           9  R5REF   ssp585      K   
	2158  REMIND           9  R5REF   ssp585    ppm   
	2159  REMIND           9  R5REF   ssp585  W/m^2   
	
	                            variable  
	0                Surface Temperature  
	1     Atmospheric Concentrations|CO2  
	2                  Radiative Forcing  
	3                Surface Temperature  
	4     Atmospheric Concentrations|CO2  
	...                              ...  
	2155  Atmospheric Concentrations|CO2  
	2156               Radiative Forcing  
	2157             Surface Temperature  
	2158  Atmospheric Concentrations|CO2  
	2159               Radiative Forcing  
	
	[2160 rows x 6 columns]

# Target file inside the temporary output directory.
multi_dim_outfile = OUTPUT_DIR / "out-multi-dimensional.nc"

# Write the multi-dimensional run to netCDF.
# NOTE(review): ``dimensions`` presumably names the metadata columns that
# become netCDF dimensions -- confirm against the scmdata ``to_nc`` docs.
multi_dimensional_run.to_nc(
    multi_dim_outfile,
    dimensions=("region", "model", "scenario", "paraset_id"),
)

/home/docs/checkouts/readthedocs.org/user_builds/scmdata/checkouts/stable/src/scmdata/_xarray.py:236: FutureWarning: The previous implementation of stack is deprecated and will be removed in a future version of pandas. See the What's New notes for pandas 2.1.0 for details. Specify future_stack=True to adopt the new implementation and silence this warning.
  else timeseries.T.stack(dimensions)

# Read the file written above back in and keep only the CO2 concentration
# timeseries.
multi_dim_loaded_co2_conc = ScmRun.from_nc(multi_dim_outfile).filter(
    variable="Atmospheric Concentrations|CO2"
)

# Long-form table (metadata columns plus ``time`` and ``value``) for plotting
# with seaborn; show the first rows.
seaborn_df = multi_dim_loaded_co2_conc.long_data()
seaborn_df.head()

	model	paraset_id	region	scenario	unit	variable	time	value
0	AIM	0	R5ASIA	ssp119	ppm	Atmospheric Concentrations|CO2	2000-01-01	0.000000
1	AIM	0	R5ASIA	ssp119	ppm	Atmospheric Concentrations|CO2	2001-01-01	0.730551
2	AIM	0	R5ASIA	ssp119	ppm	Atmospheric Concentrations|CO2	2002-01-01	0.142061
3	AIM	0	R5ASIA	ssp119	ppm	Atmospheric Concentrations|CO2	2003-01-01	2.977609
4	AIM	0	R5ASIA	ssp119	ppm	Atmospheric Concentrations|CO2	2004-01-01	0.785949

# Line plot of value against time: one facet per region (three facets per
# row), coloured by scenario and styled by model.
sns.relplot(
    data=seaborn_df,
    x="time",
    y="value",
    # NOTE(review): ``units`` together with ``estimator=None`` presumably
    # draws each paraset_id as its own line instead of aggregating them --
    # confirm against the seaborn ``lineplot`` docs.
    units="paraset_id",
    estimator=None,
    hue="scenario",
    style="model",
    col="region",
    col_wrap=3,
    kind="line",
)

<seaborn.axisgrid.FacetGrid at 0x7f353ebbc490>

../_images/4bb1339d0487ea8f7538738be0a5eb0e9b549dda7cf92ee68003be2aa72d6bb0.png

Read the Docs v: stable

Versions: latest; stable; v1.0.0; v0.16.1; v0.16.0; v0.15.3; v0.15.2; v0.15.1; v0.15.0; v0.14.2; v0.14.1; v0.14.0; v0.13.2; v0.13.1; v0.13.0; v0.12.1; v0.12.0; v0.11.0

Downloads

On Read the Docs: Project Home; Builds